corda/src/compile.cpp

10269 lines
279 KiB
C++
Raw Normal View History

2014-04-21 02:14:48 +00:00
/* Copyright (c) 2008-2014, Avian Contributors
Permission to use, copy, modify, and/or distribute this software
for any purpose with or without fee is hereby granted, provided
that the above copyright notice and this permission notice appear
in all copies.
There is NO WARRANTY for this software. See license.txt for
details. */
#include "avian/machine.h"
#include "avian/util.h"
#include "avian/alloc-vector.h"
#include "avian/process.h"
#include "avian/target.h"
#include "avian/arch.h"
#include <avian/system/memory.h>
#include <avian/codegen/assembler.h>
#include <avian/codegen/architecture.h>
#include <avian/codegen/compiler.h>
#include <avian/codegen/targets.h>
#include <avian/codegen/lir.h>
#include <avian/codegen/runtime.h>
2013-02-20 05:12:28 +00:00
2013-02-20 05:56:05 +00:00
#include <avian/util/runtime-array.h>
#include <avian/util/list.h>
2014-02-25 22:46:35 +00:00
#include <avian/util/slice.h>
2014-02-25 22:15:37 +00:00
#include <avian/util/fixed-allocator.h>
#include "debug-util.h"
using namespace vm;
2014-07-11 15:50:18 +00:00
extern "C" uint64_t vmInvoke(void* thread,
void* function,
void* arguments,
unsigned argumentFootprint,
unsigned frameSize,
unsigned returnType);
2014-07-11 15:50:18 +00:00
extern "C" void vmInvoke_returnAddress();
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
extern "C" void vmInvoke_safeStack();
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
extern "C" void vmJumpAndInvoke(void* thread,
void* function,
void* stack,
unsigned argumentFootprint,
uintptr_t* arguments,
unsigned frameSize);
2009-05-05 01:04:17 +00:00
using namespace avian::codegen;
2014-02-22 00:06:17 +00:00
using namespace avian::system;
namespace {
namespace local {
2011-02-02 15:32:40 +00:00
const bool DebugCompile = false;
const bool DebugNatives = false;
const bool DebugCallTable = false;
const bool DebugMethodTree = false;
const bool DebugInstructions = false;
2007-12-11 23:52:28 +00:00
#ifndef AVIAN_AOT_ONLY
const bool DebugFrameMaps = false;
const bool CheckArrayBounds = true;
const unsigned ExecutableAreaSizeInBytes = 30 * 1024 * 1024;
#endif
#ifdef AVIAN_CONTINUATIONS
const bool Continuations = true;
#else
const bool Continuations = false;
#endif
const unsigned MaxNativeCallFootprint = TargetBytesPerWord == 8 ? 4 : 5;
const unsigned InitialZoneCapacityInBytes = 64 * 1024;
enum ThunkIndex {
compileMethodIndex,
compileVirtualMethodIndex,
invokeNativeIndex,
throwArrayIndexOutOfBoundsIndex,
throwStackOverflowIndex,
#define THUNK(s) s##Index,
#include "thunks.cpp"
#undef THUNK
dummyIndex
};
2014-07-11 15:50:18 +00:00
inline bool isVmInvokeUnsafeStack(void* ip)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
return reinterpret_cast<uintptr_t>(ip)
2014-07-11 15:50:18 +00:00
>= reinterpret_cast<uintptr_t>(voidPointer(vmInvoke_returnAddress))
and reinterpret_cast<uintptr_t>(ip)
< reinterpret_cast<uintptr_t>(voidPointer(vmInvoke_safeStack));
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
class MyThread;
2014-07-11 15:50:18 +00:00
void* getIp(MyThread*);
2014-07-11 15:50:18 +00:00
class MyThread : public Thread {
2007-12-09 22:45:43 +00:00
public:
class CallTrace {
public:
2014-07-11 15:47:57 +00:00
CallTrace(MyThread* t, GcMethod* method)
: t(t),
ip(getIp(t)),
stack(t->stack),
scratch(t->scratch),
continuation(t->continuation),
nativeMethod((method->flags() & ACC_NATIVE) ? method : 0),
targetMethod(0),
originalMethod(method),
next(t->trace)
2007-12-09 22:45:43 +00:00
{
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
doTransition(t, 0, 0, 0, this);
2007-12-09 22:45:43 +00:00
}
2007-09-30 15:52:21 +00:00
2014-07-11 15:50:18 +00:00
~CallTrace()
{
assertT(t, t->stack == 0);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
t->scratch = scratch;
doTransition(t, ip, stack, continuation, next);
2007-12-09 22:45:43 +00:00
}
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
MyThread* t;
void* ip;
2008-08-16 18:46:14 +00:00
void* stack;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
void* scratch;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
2014-05-29 04:17:25 +00:00
GcMethod* nativeMethod;
GcMethod* targetMethod;
GcMethod* originalMethod;
2007-12-09 22:45:43 +00:00
CallTrace* next;
};
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
class Context {
public:
2014-07-11 15:50:18 +00:00
class MyProtector : public Thread::Protector {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
public:
2014-07-11 15:50:18 +00:00
MyProtector(MyThread* t, Context* context)
: Protector(t), context(context)
{
}
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
virtual void visit(Heap::Visitor* v)
{
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
v->visit(&(context->continuation));
}
Context* context;
};
2014-07-11 15:47:57 +00:00
Context(MyThread* t,
void* ip,
void* stack,
GcContinuation* continuation,
CallTrace* trace)
: ip(ip),
stack(stack),
continuation(continuation),
trace(trace),
protector(t, this)
2014-07-11 15:50:18 +00:00
{
}
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
void* ip;
void* stack;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
CallTrace* trace;
MyProtector protector;
};
2014-07-11 15:50:18 +00:00
class TraceContext : public Context {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
public:
2014-07-11 15:47:57 +00:00
TraceContext(MyThread* t,
void* ip,
void* stack,
GcContinuation* continuation,
CallTrace* trace)
: Context(t, ip, stack, continuation, trace),
t(t),
link(0),
next(t->traceContext),
methodIsMostRecent(false)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
t->traceContext = this;
}
2014-07-11 15:50:18 +00:00
TraceContext(MyThread* t, void* link)
: Context(t, t->ip, t->stack, t->continuation, t->trace),
t(t),
link(link),
next(t->traceContext),
methodIsMostRecent(false)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
t->traceContext = this;
}
2014-07-11 15:50:18 +00:00
~TraceContext()
{
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
t->traceContext = next;
}
MyThread* t;
void* link;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
TraceContext* next;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
bool methodIsMostRecent;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
};
2014-07-11 15:47:57 +00:00
static void doTransition(MyThread* t,
void* ip,
void* stack,
GcContinuation* continuation,
MyThread::CallTrace* trace)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
// in this function, we "atomically" update the thread context
// fields in such a way to ensure that another thread may
// interrupt us at any time and still get a consistent, accurate
// stack trace. See MyProcessor::getStackTrace for details.
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
assertT(t, t->transition == 0);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
Context c(t, ip, stack, continuation, trace);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
compileTimeMemoryBarrier();
t->transition = &c;
compileTimeMemoryBarrier();
t->ip = ip;
t->stack = stack;
t->continuation = continuation;
t->trace = trace;
compileTimeMemoryBarrier();
t->transition = 0;
}
2014-07-11 15:47:57 +00:00
MyThread(Machine* m,
GcThread* javaThread,
MyThread* parent,
bool useNativeFeatures)
: Thread(m, javaThread, parent),
ip(0),
stack(0),
newStack(0),
scratch(0),
continuation(0),
exceptionStackAdjustment(0),
exceptionOffset(0),
exceptionHandler(0),
tailAddress(0),
virtualCallTarget(0),
virtualCallIndex(0),
heapImage(0),
codeImage(0),
thunkTable(0),
trace(0),
reference(0),
arch(parent ? parent->arch : avian::codegen::makeArchitectureNative(
m->system,
useNativeFeatures)),
transition(0),
traceContext(0),
stackLimit(0),
referenceFrame(0),
methodLockIsClean(true)
{
arch->acquire();
}
2007-10-03 00:22:48 +00:00
2007-12-30 22:24:48 +00:00
void* ip;
2008-08-16 18:46:14 +00:00
void* stack;
void* newStack;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
void* scratch;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
2009-05-25 04:27:50 +00:00
uintptr_t exceptionStackAdjustment;
2009-05-03 20:57:11 +00:00
uintptr_t exceptionOffset;
void* exceptionHandler;
void* tailAddress;
2009-05-03 20:57:11 +00:00
void* virtualCallTarget;
uintptr_t virtualCallIndex;
uintptr_t* heapImage;
uint8_t* codeImage;
void** thunkTable;
2007-12-09 22:45:43 +00:00
CallTrace* trace;
Reference* reference;
2013-02-24 06:03:01 +00:00
avian::codegen::Architecture* arch;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
Context* transition;
TraceContext* traceContext;
uintptr_t stackLimit;
List<Reference*>* referenceFrame;
bool methodLockIsClean;
2007-12-09 22:45:43 +00:00
};
2014-07-11 15:47:57 +00:00
void transition(MyThread* t,
void* ip,
void* stack,
GcContinuation* continuation,
MyThread::CallTrace* trace)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
MyThread::doTransition(t, ip, stack, continuation, trace);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
2014-07-11 15:50:18 +00:00
object resolveThisPointer(MyThread* t, void* stack)
2007-12-09 22:45:43 +00:00
{
2014-07-11 15:50:18 +00:00
return reinterpret_cast<object*>(
stack)[t->arch->frameFooterSize() + t->arch->frameReturnAddressSize()];
}
2007-12-23 19:26:35 +00:00
2014-07-11 15:47:57 +00:00
GcMethod* findMethod(Thread* t, GcMethod* method, object instance)
{
2014-05-29 04:17:25 +00:00
if ((method->flags() & ACC_STATIC) == 0) {
if (method->class_()->flags() & ACC_INTERFACE) {
return findInterfaceMethod(t, method, objectClass(t, instance));
} else if (methodVirtual(t, method)) {
2014-05-29 04:17:25 +00:00
return findVirtualMethod(t, method, objectClass(t, instance));
}
}
return method;
}
2014-07-11 15:47:57 +00:00
GcMethod* resolveTarget(MyThread* t, void* stack, GcMethod* method)
{
2014-05-29 04:17:25 +00:00
GcClass* class_ = objectClass(t, resolveThisPointer(t, stack));
2007-10-03 00:22:48 +00:00
2014-05-29 04:17:25 +00:00
if (class_->vmFlags() & BootstrapFlag) {
PROTECT(t, method);
PROTECT(t, class_);
2014-06-30 01:44:41 +00:00
resolveSystemClass(t, roots(t)->bootLoader(), class_->name());
2007-10-03 00:22:48 +00:00
}
if (method->class_()->flags() & ACC_INTERFACE) {
return findInterfaceMethod(t, method, class_);
} else {
return findVirtualMethod(t, method, class_);
}
2007-12-09 22:45:43 +00:00
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:47:57 +00:00
GcMethod* resolveTarget(MyThread* t, GcClass* class_, unsigned index)
{
2014-05-29 04:17:25 +00:00
if (class_->vmFlags() & BootstrapFlag) {
PROTECT(t, class_);
2014-06-30 01:44:41 +00:00
resolveSystemClass(t, roots(t)->bootLoader(), class_->name());
}
2014-07-11 15:47:57 +00:00
return cast<GcMethod>(
t, cast<GcArray>(t, class_->virtualTable())->body()[index]);
}
2014-07-11 15:47:57 +00:00
GcCompileRoots* compileRoots(Thread* t);
2007-10-03 00:22:48 +00:00
2014-07-11 15:47:57 +00:00
intptr_t methodCompiled(Thread* t UNUSED, GcMethod* method)
{
2014-06-28 04:00:05 +00:00
return method->code()->compiled();
}
2014-07-11 15:47:57 +00:00
unsigned methodCompiledSize(Thread* t UNUSED, GcMethod* method)
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
{
2014-06-28 04:00:05 +00:00
return method->code()->compiledSize();
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
}
2014-07-11 15:47:57 +00:00
intptr_t compareIpToMethodBounds(Thread* t, intptr_t ip, object om)
{
2014-05-29 04:17:25 +00:00
GcMethod* method = cast<GcMethod>(t, om);
2008-11-23 23:58:01 +00:00
intptr_t start = methodCompiled(t, method);
if (DebugMethodTree) {
2014-07-11 15:50:18 +00:00
fprintf(stderr,
"find %p in (%p,%p)\n",
reinterpret_cast<void*>(ip),
reinterpret_cast<void*>(start),
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
reinterpret_cast<void*>(start + methodCompiledSize(t, method)));
}
if (ip < start) {
return -1;
2014-07-11 15:50:18 +00:00
} else if (ip < start
+ static_cast<intptr_t>(methodCompiledSize(t, method))) {
return 0;
} else {
return 1;
}
}
2014-07-11 15:47:57 +00:00
GcMethod* methodForIp(MyThread* t, void* ip)
{
if (DebugMethodTree) {
fprintf(stderr, "query for method containing %p\n", ip);
}
// we must use a version of the method tree at least as recent as the
// compiled form of the method containing the specified address (see
// compile(MyThread*, FixedAllocator*, BootContext*, object)):
loadMemoryBarrier();
2014-07-11 15:47:57 +00:00
return cast<GcMethod>(t,
treeQuery(t,
compileRoots(t)->methodTree(),
reinterpret_cast<intptr_t>(ip),
compileRoots(t)->methodTreeSentinal(),
compareIpToMethodBounds));
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:47:57 +00:00
unsigned localSize(MyThread* t UNUSED, GcMethod* method)
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
{
2014-06-28 04:00:05 +00:00
unsigned size = method->code()->maxLocals();
2014-07-11 15:47:57 +00:00
if ((method->flags() & (ACC_SYNCHRONIZED | ACC_STATIC)) == ACC_SYNCHRONIZED) {
2014-07-11 15:50:18 +00:00
++size;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
}
return size;
}
2014-07-11 15:47:57 +00:00
unsigned alignedFrameSize(MyThread* t, GcMethod* method)
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
{
2014-07-11 15:47:57 +00:00
return t->arch->alignFrameSize(
localSize(t, method) - method->parameterFootprint()
+ method->code()->maxStack()
+ t->arch->frameFootprint(MaxNativeCallFootprint));
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
}
2014-07-11 15:47:57 +00:00
void nextFrame(MyThread* t,
void** ip,
void** sp,
GcMethod* method,
GcMethod* target,
bool mostRecent)
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
{
2014-06-29 04:57:07 +00:00
GcCode* code = method->code();
intptr_t start = code->compiled();
void* link;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
bool methodIsMostRecent;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
if (t->traceContext) {
link = t->traceContext->link;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
methodIsMostRecent = mostRecent and t->traceContext->methodIsMostRecent;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
} else {
link = 0;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
methodIsMostRecent = false;
}
if (false) {
fprintf(stderr,
"nextFrame %s.%s%s target %s.%s%s ip %p sp %p\n",
method->class_()->name()->body().begin(),
method->name()->body().begin(),
method->spec()->body().begin(),
target ? target->class_()->name()->body().begin() : 0,
target ? target->name()->body().begin() : 0,
target ? target->spec()->body().begin() : 0,
*ip,
*sp);
}
2014-07-11 15:47:57 +00:00
t->arch->nextFrame(reinterpret_cast<void*>(start),
code->compiledSize(),
alignedFrameSize(t, method),
link,
methodIsMostRecent,
target ? target->parameterFootprint() : -1,
ip,
sp);
2011-01-29 18:11:27 +00:00
if (false) {
fprintf(stderr, "next frame ip %p sp %p\n", *ip, *sp);
}
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
}
2014-07-11 15:50:18 +00:00
void* getIp(MyThread* t, void* ip, void* stack)
{
// Here we use the convention that, if the return address is neither
// pushed on to the stack automatically as part of the call nor
// stored in the caller's frame, it will be saved in MyThread::ip
// instead of on the stack. See the various implementations of
// Assembler::saveFrame for details on how this is done.
return t->arch->returnAddressOffset() < 0 ? ip : t->arch->frameIp(stack);
}
2014-07-11 15:50:18 +00:00
void* getIp(MyThread* t)
{
return getIp(t, t->ip, t->stack);
}
2014-07-11 15:50:18 +00:00
class MyStackWalker : public Processor::StackWalker {
2007-12-09 22:45:43 +00:00
public:
2014-07-11 15:50:18 +00:00
enum State { Start, Next, Trace, Continuation, Method, NativeMethod, Finish };
2008-04-23 16:33:31 +00:00
2014-07-11 15:50:18 +00:00
class MyProtector : public Thread::Protector {
2007-12-09 22:45:43 +00:00
public:
2014-07-11 15:50:18 +00:00
MyProtector(MyStackWalker* walker) : Protector(walker->t), walker(walker)
{
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:50:18 +00:00
virtual void visit(Heap::Visitor* v)
{
v->visit(&(walker->method_));
v->visit(&(walker->target));
2009-05-03 20:57:11 +00:00
v->visit(&(walker->continuation));
2007-12-09 22:45:43 +00:00
}
2007-10-03 00:22:48 +00:00
2007-12-09 22:45:43 +00:00
MyStackWalker* walker;
};
2014-07-11 15:50:18 +00:00
MyStackWalker(MyThread* t)
: t(t), state(Start), method_(0), target(0), count_(0), protector(this)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
if (t->traceContext) {
ip_ = t->traceContext->ip;
stack = t->traceContext->stack;
trace = t->traceContext->trace;
continuation = t->traceContext->continuation;
} else {
ip_ = getIp(t);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
stack = t->stack;
trace = t->trace;
2014-05-29 04:17:25 +00:00
continuation = t->continuation;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
MyStackWalker(MyStackWalker* w)
: t(w->t),
state(w->state),
ip_(w->ip_),
stack(w->stack),
trace(w->trace),
method_(w->method_),
target(w->target),
continuation(w->continuation),
count_(w->count_),
protector(this)
{
}
2014-07-11 15:50:18 +00:00
virtual void walk(Processor::StackVisitor* v)
{
2008-04-23 16:33:31 +00:00
for (MyStackWalker it(this); it.valid();) {
2009-07-10 14:33:38 +00:00
MyStackWalker walker(&it);
2008-04-23 16:33:31 +00:00
if (not v->visit(&walker)) {
break;
}
it.next();
}
2008-04-23 16:33:31 +00:00
}
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
bool valid()
{
2008-04-23 16:33:31 +00:00
while (true) {
if (false) {
fprintf(stderr, "state: %d\n", state);
}
2008-04-23 16:33:31 +00:00
switch (state) {
case Start:
if (trace and trace->nativeMethod) {
method_ = trace->nativeMethod;
state = NativeMethod;
} else {
state = Next;
2008-04-23 16:33:31 +00:00
}
break;
2007-12-09 22:45:43 +00:00
2008-04-23 16:33:31 +00:00
case Next:
if (stack) {
target = method_;
2008-04-23 16:33:31 +00:00
method_ = methodForIp(t, ip_);
if (method_) {
state = Method;
2009-05-03 20:57:11 +00:00
} else if (continuation) {
2014-06-29 03:50:32 +00:00
method_ = continuation->method();
2009-05-03 20:57:11 +00:00
state = Continuation;
2008-04-23 16:33:31 +00:00
} else {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
state = Trace;
2008-04-23 16:33:31 +00:00
}
} else {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
state = Trace;
2008-04-23 16:33:31 +00:00
}
2007-12-09 22:45:43 +00:00
break;
2008-04-23 16:33:31 +00:00
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
case Trace: {
if (trace) {
continuation = trace->continuation;
stack = trace->stack;
ip_ = trace->ip;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
trace = trace->next;
state = Start;
} else {
state = Finish;
}
} break;
2009-05-03 20:57:11 +00:00
case Continuation:
2008-04-23 16:33:31 +00:00
case Method:
case NativeMethod:
return true;
case Finish:
return false;
2014-05-29 04:17:25 +00:00
2008-04-23 16:33:31 +00:00
default:
abort(t);
2007-12-09 22:45:43 +00:00
}
}
}
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
void next()
{
2012-05-05 00:59:15 +00:00
expect(t, count_ <= stackSizeInWords(t));
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
2008-04-23 16:33:31 +00:00
switch (state) {
2009-05-03 20:57:11 +00:00
case Continuation:
2014-06-29 03:50:32 +00:00
continuation = continuation->next();
2009-05-03 20:57:11 +00:00
break;
2008-04-23 16:33:31 +00:00
case Method:
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
nextFrame(t, &ip_, &stack, method_, target, count_ == 0);
2008-04-23 16:33:31 +00:00
break;
2008-04-23 16:33:31 +00:00
case NativeMethod:
break;
2014-05-29 04:17:25 +00:00
2008-04-23 16:33:31 +00:00
default:
abort(t);
}
2014-07-11 15:50:18 +00:00
++count_;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
state = Next;
}
2014-07-11 15:47:57 +00:00
virtual GcMethod* method()
{
if (false) {
fprintf(stderr,
"method %s.%s\n",
method_->class_()->name()->body().begin(),
method_->name()->body().begin());
}
return method_;
2007-10-03 00:22:48 +00:00
}
2014-07-11 15:50:18 +00:00
virtual int ip()
{
2008-04-23 16:33:31 +00:00
switch (state) {
2009-05-03 20:57:11 +00:00
case Continuation:
2014-06-29 03:50:32 +00:00
return reinterpret_cast<intptr_t>(continuation->address())
2014-07-11 15:47:57 +00:00
- methodCompiled(t, continuation->method());
2009-05-03 20:57:11 +00:00
2008-04-23 16:33:31 +00:00
case Method:
2008-11-23 23:58:01 +00:00
return reinterpret_cast<intptr_t>(ip_) - methodCompiled(t, method_);
2014-05-29 04:17:25 +00:00
2008-04-23 16:33:31 +00:00
case NativeMethod:
return 0;
default:
abort(t);
2007-10-03 00:22:48 +00:00
}
}
2014-07-11 15:50:18 +00:00
virtual unsigned count()
{
2008-04-23 16:33:31 +00:00
unsigned count = 0;
2007-12-09 22:45:43 +00:00
2008-04-23 16:33:31 +00:00
for (MyStackWalker walker(this); walker.valid();) {
walker.next();
2014-07-11 15:50:18 +00:00
++count;
2008-04-23 16:33:31 +00:00
}
2014-05-29 04:17:25 +00:00
2008-04-23 16:33:31 +00:00
return count;
2007-10-03 00:22:48 +00:00
}
2007-12-09 22:45:43 +00:00
MyThread* t;
2008-04-23 16:33:31 +00:00
State state;
void* ip_;
2007-12-09 22:45:43 +00:00
void* stack;
MyThread::CallTrace* trace;
2014-05-29 04:17:25 +00:00
GcMethod* method_;
GcMethod* target;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
unsigned count_;
2007-12-09 22:45:43 +00:00
MyProtector protector;
};
2014-07-11 15:47:57 +00:00
int localOffset(MyThread* t, int v, GcMethod* method)
2007-12-09 22:45:43 +00:00
{
2014-05-29 04:17:25 +00:00
int parameterFootprint = method->parameterFootprint();
int frameSize = alignedFrameSize(t, method);
2014-07-11 15:50:18 +00:00
int offset
= ((v < parameterFootprint)
? (frameSize + parameterFootprint + t->arch->frameFooterSize()
+ t->arch->frameHeaderSize() - v - 1)
: (frameSize + parameterFootprint - v - 1));
assertT(t, offset >= 0);
return offset;
2007-12-09 22:45:43 +00:00
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:47:57 +00:00
int localOffsetFromStack(MyThread* t, int index, GcMethod* method)
2009-05-03 20:57:11 +00:00
{
2014-07-11 15:50:18 +00:00
return localOffset(t, index, method) + t->arch->frameReturnAddressSize();
2009-05-03 20:57:11 +00:00
}
2014-07-11 15:47:57 +00:00
object* localObject(MyThread* t, void* stack, GcMethod* method, unsigned index)
{
2009-05-17 23:43:48 +00:00
return static_cast<object*>(stack) + localOffsetFromStack(t, index, method);
2009-05-03 20:57:11 +00:00
}
2014-07-11 15:47:57 +00:00
int stackOffsetFromFrame(MyThread* t, GcMethod* method)
2009-05-03 20:57:11 +00:00
{
return alignedFrameSize(t, method) + t->arch->frameHeaderSize();
}
2014-07-11 15:47:57 +00:00
void* stackForFrame(MyThread* t, void* frame, GcMethod* method)
{
2009-05-03 20:57:11 +00:00
return static_cast<void**>(frame) - stackOffsetFromFrame(t, method);
}
2014-07-11 15:50:18 +00:00
class PoolElement : public avian::codegen::Promise {
2007-12-09 22:45:43 +00:00
public:
2014-07-11 15:50:18 +00:00
PoolElement(Thread* t, object target, PoolElement* next)
: t(t), target(target), address(0), next(next)
{
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
virtual int64_t value()
{
assertT(t, resolved());
2008-11-23 23:58:01 +00:00
return address;
}
2014-07-11 15:50:18 +00:00
virtual bool resolved()
{
2008-11-23 23:58:01 +00:00
return address != 0;
}
Thread* t;
object target;
intptr_t address;
PoolElement* next;
2007-12-09 22:45:43 +00:00
};
class Subroutine {
public:
Subroutine(unsigned index,
unsigned returnAddress,
unsigned methodSize,
Subroutine* outer)
: index(index),
outer(outer),
returnAddress(returnAddress),
duplicatedBaseIp(methodSize * index),
visited(false)
2014-07-11 15:50:18 +00:00
{
}
// Index of this subroutine, in the (unmaterialized) list of subroutines in
// this method.
2014-06-01 03:28:27 +00:00
// Note that in the presence of nested finallys, this could theoretically end
// up being greater than the number of jsr instructions (but this will be
// extremely rare - I don't think we've seen this in practice).
const unsigned index;
// Subroutine outer to this one (if, for instance, we have nested finallys)
Subroutine* const outer;
// Starting ip in the original bytecode (always < original bytecode size)
const unsigned returnAddress;
// Starting ip for this subroutine's copy of the method bytecode
const unsigned duplicatedBaseIp;
bool visited;
};
class Context;
2014-07-11 15:50:18 +00:00
class TraceElement : public avian::codegen::TraceHandler {
2007-12-09 22:45:43 +00:00
public:
static const unsigned VirtualCall = 1 << 0;
2014-07-11 15:50:18 +00:00
static const unsigned TailCall = 1 << 1;
static const unsigned LongCall = 1 << 2;
2014-07-11 15:47:57 +00:00
TraceElement(Context* context,
unsigned ip,
GcMethod* target,
unsigned flags,
TraceElement* next,
unsigned mapSize)
: context(context),
address(0),
next(next),
target(target),
ip(ip),
argumentIndex(0),
flags(flags),
watch(false)
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
{
memset(map, 0xFF, mapSize * BytesPerWord);
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
virtual void handleTrace(avian::codegen::Promise* address,
unsigned argumentIndex)
{
if (this->address == 0) {
this->address = address;
this->argumentIndex = argumentIndex;
}
}
Context* context;
avian::codegen::Promise* address;
TraceElement* next;
2014-05-29 04:17:25 +00:00
GcMethod* target;
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
unsigned ip;
unsigned argumentIndex;
unsigned flags;
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
bool watch;
uintptr_t map[0];
2007-10-03 00:22:48 +00:00
};
2014-07-11 15:50:18 +00:00
class TraceElementPromise : public avian::codegen::Promise {
public:
2014-07-11 15:50:18 +00:00
TraceElementPromise(System* s, TraceElement* trace) : s(s), trace(trace)
{
}
2014-07-11 15:50:18 +00:00
virtual int64_t value()
{
assertT(s, resolved());
2009-04-22 01:39:25 +00:00
return trace->address->value();
}
2014-07-11 15:50:18 +00:00
virtual bool resolved()
{
2009-04-22 01:39:25 +00:00
return trace->address != 0 and trace->address->resolved();
}
System* s;
TraceElement* trace;
};
2008-01-07 14:51:07 +00:00
enum Event {
2008-07-05 20:21:13 +00:00
PushContextEvent,
PopContextEvent,
2008-01-07 14:51:07 +00:00
IpEvent,
MarkEvent,
ClearEvent,
PushExceptionHandlerEvent,
TraceEvent,
2008-01-07 14:51:07 +00:00
};
2014-07-11 15:47:57 +00:00
unsigned frameMapSizeInBits(MyThread* t, GcMethod* method)
{
2014-06-28 04:00:05 +00:00
return localSize(t, method) + method->code()->maxStack();
}
2014-07-11 15:47:57 +00:00
unsigned frameMapSizeInWords(MyThread* t, GcMethod* method)
2008-01-07 14:51:07 +00:00
{
2013-02-11 01:06:15 +00:00
return ceilingDivide(frameMapSizeInBits(t, method), BitsPerWord);
2008-01-07 14:51:07 +00:00
}
enum Thunk {
#define THUNK(s) s##Thunk,
#include "thunks.cpp"
#undef THUNK
};
const unsigned ThunkCount = idleIfNecessaryThunk + 1;
2014-07-11 15:50:18 +00:00
intptr_t getThunk(MyThread* t, Thunk thunk);
2008-11-23 23:58:01 +00:00
class BootContext {
public:
2014-07-11 15:50:18 +00:00
class MyProtector : public Thread::Protector {
2008-11-23 23:58:01 +00:00
public:
2014-07-11 15:50:18 +00:00
MyProtector(Thread* t, BootContext* c) : Protector(t), c(c)
{
}
2008-11-23 23:58:01 +00:00
2014-07-11 15:50:18 +00:00
virtual void visit(Heap::Visitor* v)
{
v->visit(&(c->constants));
v->visit(&(c->calls));
2008-11-23 23:58:01 +00:00
}
BootContext* c;
};
2014-07-11 15:47:57 +00:00
BootContext(Thread* t,
GcTriple* constants,
GcTriple* calls,
avian::codegen::DelayedPromise* addresses,
Zone* zone,
OffsetResolver* resolver)
: protector(t, this),
constants(constants),
calls(calls),
addresses(addresses),
addressSentinal(addresses),
zone(zone),
resolver(resolver)
2014-07-11 15:50:18 +00:00
{
}
2008-11-23 23:58:01 +00:00
MyProtector protector;
2014-06-29 04:57:07 +00:00
GcTriple* constants;
GcTriple* calls;
avian::codegen::DelayedPromise* addresses;
avian::codegen::DelayedPromise* addressSentinal;
2008-11-23 23:58:01 +00:00
Zone* zone;
OffsetResolver* resolver;
2008-11-23 23:58:01 +00:00
};
class Context {
2007-10-10 22:39:40 +00:00
public:
2014-07-11 15:50:18 +00:00
class MyResource : public Thread::AutoResource {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
public:
2014-07-11 15:50:18 +00:00
MyResource(Context* c) : AutoResource(c->thread), c(c)
{
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
2014-07-11 15:50:18 +00:00
virtual void release()
{
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
c->dispose();
}
Context* c;
};
2014-07-11 15:50:18 +00:00
class MyProtector : public Thread::Protector {
2007-12-09 22:45:43 +00:00
public:
2014-07-11 15:50:18 +00:00
MyProtector(Context* c) : Protector(c->thread), c(c)
{
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
virtual void visit(Heap::Visitor* v)
{
v->visit(&(c->method));
2007-12-09 22:45:43 +00:00
for (PoolElement* p = c->objectPool; p; p = p->next) {
2008-11-23 23:58:01 +00:00
v->visit(&(p->target));
}
2007-12-09 22:45:43 +00:00
for (TraceElement* p = c->traceLog; p; p = p->next) {
v->visit(&(p->target));
2007-12-09 22:45:43 +00:00
}
}
Context* c;
2007-10-10 22:39:40 +00:00
};
2014-07-11 15:50:18 +00:00
class MyClient : public Compiler::Client {
public:
2014-07-11 15:50:18 +00:00
MyClient(MyThread* t) : t(t)
{
}
2014-07-11 15:50:18 +00:00
virtual intptr_t getThunk(avian::codegen::lir::UnaryOperation, unsigned)
{
abort(t);
}
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
virtual intptr_t getThunk(avian::codegen::lir::BinaryOperation op,
unsigned size,
unsigned resultSize)
{
if (size == 8) {
2014-07-11 15:50:18 +00:00
switch (op) {
case avian::codegen::lir::Absolute:
assertT(t, resultSize == 8);
2009-12-01 16:21:33 +00:00
return local::getThunk(t, absoluteLongThunk);
case avian::codegen::lir::FloatNegate:
assertT(t, resultSize == 8);
return local::getThunk(t, negateDoubleThunk);
case avian::codegen::lir::FloatSquareRoot:
assertT(t, resultSize == 8);
return local::getThunk(t, squareRootDoubleThunk);
case avian::codegen::lir::Float2Float:
assertT(t, resultSize == 4);
return local::getThunk(t, doubleToFloatThunk);
case avian::codegen::lir::Float2Int:
if (resultSize == 8) {
return local::getThunk(t, doubleToLongThunk);
} else {
assertT(t, resultSize == 4);
return local::getThunk(t, doubleToIntThunk);
}
case avian::codegen::lir::Int2Float:
if (resultSize == 8) {
return local::getThunk(t, longToDoubleThunk);
} else {
assertT(t, resultSize == 4);
return local::getThunk(t, longToFloatThunk);
}
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
} else {
assertT(t, size == 4);
2014-07-11 15:50:18 +00:00
switch (op) {
case avian::codegen::lir::Absolute:
assertT(t, resultSize == 4);
2009-12-01 16:21:33 +00:00
return local::getThunk(t, absoluteIntThunk);
case avian::codegen::lir::FloatNegate:
assertT(t, resultSize == 4);
return local::getThunk(t, negateFloatThunk);
case avian::codegen::lir::FloatAbsolute:
assertT(t, resultSize == 4);
return local::getThunk(t, absoluteFloatThunk);
case avian::codegen::lir::Float2Float:
assertT(t, resultSize == 8);
return local::getThunk(t, floatToDoubleThunk);
case avian::codegen::lir::Float2Int:
if (resultSize == 4) {
return local::getThunk(t, floatToIntThunk);
} else {
assertT(t, resultSize == 8);
return local::getThunk(t, floatToLongThunk);
}
case avian::codegen::lir::Int2Float:
if (resultSize == 4) {
return local::getThunk(t, intToFloatThunk);
} else {
assertT(t, resultSize == 8);
return local::getThunk(t, intToDoubleThunk);
}
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
}
}
2014-07-11 15:50:18 +00:00
virtual intptr_t getThunk(avian::codegen::lir::TernaryOperation op,
unsigned size,
unsigned,
bool* threadParameter)
{
*threadParameter = false;
if (size == 8) {
switch (op) {
case avian::codegen::lir::Divide:
*threadParameter = true;
return local::getThunk(t, divideLongThunk);
case avian::codegen::lir::Remainder:
*threadParameter = true;
return local::getThunk(t, moduloLongThunk);
case avian::codegen::lir::FloatAdd:
return local::getThunk(t, addDoubleThunk);
case avian::codegen::lir::FloatSubtract:
return local::getThunk(t, subtractDoubleThunk);
case avian::codegen::lir::FloatMultiply:
return local::getThunk(t, multiplyDoubleThunk);
case avian::codegen::lir::FloatDivide:
return local::getThunk(t, divideDoubleThunk);
case avian::codegen::lir::FloatRemainder:
return local::getThunk(t, moduloDoubleThunk);
case avian::codegen::lir::JumpIfFloatEqual:
case avian::codegen::lir::JumpIfFloatNotEqual:
case avian::codegen::lir::JumpIfFloatLess:
case avian::codegen::lir::JumpIfFloatGreater:
case avian::codegen::lir::JumpIfFloatLessOrEqual:
case avian::codegen::lir::JumpIfFloatGreaterOrUnordered:
case avian::codegen::lir::JumpIfFloatGreaterOrEqualOrUnordered:
return local::getThunk(t, compareDoublesGThunk);
case avian::codegen::lir::JumpIfFloatGreaterOrEqual:
case avian::codegen::lir::JumpIfFloatLessOrUnordered:
case avian::codegen::lir::JumpIfFloatLessOrEqualOrUnordered:
return local::getThunk(t, compareDoublesLThunk);
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
} else {
assertT(t, size == 4);
switch (op) {
case avian::codegen::lir::Divide:
*threadParameter = true;
return local::getThunk(t, divideIntThunk);
case avian::codegen::lir::Remainder:
*threadParameter = true;
2009-10-29 20:14:44 +00:00
return local::getThunk(t, moduloIntThunk);
case avian::codegen::lir::FloatAdd:
return local::getThunk(t, addFloatThunk);
case avian::codegen::lir::FloatSubtract:
return local::getThunk(t, subtractFloatThunk);
case avian::codegen::lir::FloatMultiply:
return local::getThunk(t, multiplyFloatThunk);
case avian::codegen::lir::FloatDivide:
return local::getThunk(t, divideFloatThunk);
case avian::codegen::lir::FloatRemainder:
return local::getThunk(t, moduloFloatThunk);
case avian::codegen::lir::JumpIfFloatEqual:
case avian::codegen::lir::JumpIfFloatNotEqual:
case avian::codegen::lir::JumpIfFloatLess:
case avian::codegen::lir::JumpIfFloatGreater:
case avian::codegen::lir::JumpIfFloatLessOrEqual:
case avian::codegen::lir::JumpIfFloatGreaterOrUnordered:
case avian::codegen::lir::JumpIfFloatGreaterOrEqualOrUnordered:
return local::getThunk(t, compareFloatsGThunk);
case avian::codegen::lir::JumpIfFloatGreaterOrEqual:
case avian::codegen::lir::JumpIfFloatLessOrUnordered:
case avian::codegen::lir::JumpIfFloatLessOrEqualOrUnordered:
return local::getThunk(t, compareFloatsLThunk);
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
}
}
MyThread* t;
};
2014-05-29 04:17:25 +00:00
Context(MyThread* t, BootContext* bootContext, GcMethod* method)
: thread(t),
2014-05-05 04:02:47 +00:00
zone(t->m->heap, InitialZoneCapacityInBytes),
assembler(t->arch->makeAssembler(t->m->heap, &zone)),
client(t),
compiler(makeCompiler(t->m->system, assembler, &zone, &client)),
method(method),
bootContext(bootContext),
objectPool(0),
subroutineCount(0),
traceLog(0),
visitTable(
2014-07-11 15:47:57 +00:00
Slice<uint16_t>::allocAndSet(&zone, method->code()->length(), 0)),
rootTable(Slice<uintptr_t>::allocAndSet(
&zone,
method->code()->length() * frameMapSizeInWords(t, method),
~(uintptr_t)0)),
executableAllocator(0),
executableStart(0),
executableSize(0),
objectPoolCount(0),
traceLogCount(0),
dirtyRoots(false),
leaf(true),
eventLog(t->m->system, t->m->heap, 1024),
protector(this),
resource(this),
argumentBuffer(
(ir::Value**)t->m->heap->allocate(256 * sizeof(ir::Value*)),
256) // below the maximal allowed parameter count for Java
2014-07-11 15:50:18 +00:00
{
}
Context(MyThread* t)
: thread(t),
2014-05-05 04:02:47 +00:00
zone(t->m->heap, InitialZoneCapacityInBytes),
assembler(t->arch->makeAssembler(t->m->heap, &zone)),
client(t),
compiler(0),
method(0),
bootContext(0),
objectPool(0),
subroutineCount(0),
traceLog(0),
visitTable(0, 0),
rootTable(0, 0),
executableAllocator(0),
executableStart(0),
executableSize(0),
objectPoolCount(0),
traceLogCount(0),
dirtyRoots(false),
leaf(true),
eventLog(t->m->system, t->m->heap, 0),
protector(this),
resource(this),
argumentBuffer(0, 0)
2014-07-11 15:50:18 +00:00
{
}
2014-07-11 15:50:18 +00:00
~Context()
{
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
dispose();
}
2014-07-11 15:50:18 +00:00
void dispose()
{
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
if (compiler) {
compiler->dispose();
}
2008-02-11 17:21:41 +00:00
assembler->dispose();
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
if (executableAllocator) {
executableAllocator->free(executableStart, executableSize);
}
eventLog.dispose();
zone.dispose();
if (argumentBuffer.begin()) {
thread->m->heap->free(argumentBuffer.begin(), 256 * sizeof(ir::Value*));
}
}
void extendLogicalCode(unsigned more)
{
compiler->extendLogicalCode(more);
visitTable = visitTable.cloneAndSet(&zone, visitTable.count + more, 0);
rootTable = rootTable.cloneAndSet(
&zone,
rootTable.count + more * frameMapSizeInWords(thread, method),
~(uintptr_t)0);
}
2008-02-11 17:21:41 +00:00
MyThread* thread;
Zone zone;
avian::codegen::Assembler* assembler;
MyClient client;
avian::codegen::Compiler* compiler;
2014-05-29 04:17:25 +00:00
GcMethod* method;
2008-11-23 23:58:01 +00:00
BootContext* bootContext;
PoolElement* objectPool;
unsigned subroutineCount;
TraceElement* traceLog;
Slice<uint16_t> visitTable;
Slice<uintptr_t> rootTable;
2014-05-05 04:43:27 +00:00
Alloc* executableAllocator;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
void* executableStart;
unsigned executableSize;
unsigned objectPoolCount;
unsigned traceLogCount;
bool dirtyRoots;
bool leaf;
2008-01-07 14:51:07 +00:00
Vector eventLog;
MyProtector protector;
MyResource resource;
Slice<ir::Value*> argumentBuffer;
};
2014-07-11 15:50:18 +00:00
unsigned translateLocalIndex(Context* context,
unsigned footprint,
unsigned index)
2009-05-03 20:57:11 +00:00
{
2014-05-29 04:17:25 +00:00
unsigned parameterFootprint = context->method->parameterFootprint();
2009-05-03 20:57:11 +00:00
if (index < parameterFootprint) {
return parameterFootprint - index - footprint;
} else {
return index;
}
}
2014-05-01 18:44:42 +00:00
ir::Value* loadLocal(Context* context,
unsigned footprint,
ir::Type type,
unsigned index)
2009-05-03 20:57:11 +00:00
{
2014-05-02 16:05:19 +00:00
ir::Value* result = context->compiler->loadLocal(
2014-05-01 13:18:12 +00:00
type, translateLocalIndex(context, footprint, index));
2014-05-02 16:05:19 +00:00
assertT(context->thread, type == result->type);
2014-05-02 16:05:19 +00:00
return result;
2009-05-03 20:57:11 +00:00
}
2014-05-01 18:44:42 +00:00
void storeLocal(Context* context,
unsigned footprint,
2014-05-02 16:05:19 +00:00
ir::Type type UNUSED,
2014-05-01 18:44:42 +00:00
ir::Value* value,
unsigned index)
2009-05-03 20:57:11 +00:00
{
assertT(context->thread, type == value->type);
context->compiler->storeLocal(value,
translateLocalIndex(context, footprint, index));
2009-05-03 20:57:11 +00:00
}
2014-02-25 22:15:37 +00:00
avian::util::FixedAllocator* codeAllocator(MyThread* t);
2014-05-01 19:56:39 +00:00
ir::Type operandTypeForFieldCode(Thread* t, unsigned code)
{
switch (code) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case IntField:
2014-06-01 20:22:14 +00:00
return ir::Type::i4();
2014-05-01 19:56:39 +00:00
case LongField:
2014-06-01 20:22:14 +00:00
return ir::Type::i8();
2014-05-01 19:56:39 +00:00
case ObjectField:
2014-06-01 20:22:14 +00:00
return ir::Type::object();
2014-05-01 19:56:39 +00:00
case FloatField:
2014-06-01 20:22:14 +00:00
return ir::Type::f4();
2014-05-01 19:56:39 +00:00
case DoubleField:
2014-06-01 20:22:14 +00:00
return ir::Type::f8();
2014-05-01 19:56:39 +00:00
case VoidField:
2014-06-01 20:22:14 +00:00
return ir::Type::void_();
2014-05-01 19:56:39 +00:00
default:
abort(t);
}
}
2014-05-01 20:30:45 +00:00
unsigned methodReferenceParameterFootprint(Thread* t,
2014-06-29 04:57:07 +00:00
GcReference* reference,
2014-05-01 20:30:45 +00:00
bool isStatic)
{
return parameterFootprint(
t,
2014-07-11 15:47:57 +00:00
reinterpret_cast<const char*>(reference->spec()->body().begin()),
2014-05-01 20:30:45 +00:00
isStatic);
}
2014-06-29 04:57:07 +00:00
int methodReferenceReturnCode(Thread* t, GcReference* reference)
2014-05-01 20:30:45 +00:00
{
unsigned parameterCount;
unsigned parameterFootprint;
unsigned returnCode;
2014-07-11 15:47:57 +00:00
scanMethodSpec(
t,
reinterpret_cast<const char*>(reference->spec()->body().begin()),
true,
&parameterCount,
&parameterFootprint,
&returnCode);
2014-05-01 20:30:45 +00:00
return returnCode;
}
class Frame {
public:
2014-05-05 16:49:50 +00:00
Frame(Context* context, ir::Type* stackMap)
2014-05-01 02:11:54 +00:00
: context(context),
t(context->thread),
c(context->compiler),
subroutine(0),
stackMap(stackMap),
ip(0),
sp(localSize()),
2014-06-01 20:22:14 +00:00
level(0)
2007-12-09 22:45:43 +00:00
{
2014-07-11 15:47:57 +00:00
memset(stackMap, 0, context->method->code()->maxStack() * sizeof(ir::Type));
2007-12-09 22:45:43 +00:00
}
2014-05-05 16:49:50 +00:00
Frame(Frame* f, ir::Type* stackMap)
2014-05-01 02:11:54 +00:00
: context(f->context),
t(context->thread),
c(context->compiler),
subroutine(f->subroutine),
stackMap(stackMap),
ip(f->ip),
sp(f->sp),
2014-06-01 20:22:14 +00:00
level(f->level + 1)
2007-12-09 22:45:43 +00:00
{
2014-05-05 16:49:50 +00:00
memcpy(stackMap,
f->stackMap,
2014-06-28 04:00:05 +00:00
context->method->code()->maxStack() * sizeof(ir::Type));
2008-01-07 14:51:07 +00:00
if (level > 1) {
2008-07-05 20:21:13 +00:00
context->eventLog.append(PushContextEvent);
2008-01-07 14:51:07 +00:00
}
}
2014-07-11 15:50:18 +00:00
~Frame()
{
dispose();
}
2014-07-11 15:50:18 +00:00
void dispose()
{
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
if (level > 1) {
2014-05-01 18:44:42 +00:00
context->eventLog.append(PopContextEvent);
2008-01-07 14:51:07 +00:00
}
2007-10-10 22:39:40 +00:00
}
ir::Value* append(object o)
2014-05-01 18:44:42 +00:00
{
BootContext* bc = context->bootContext;
if (bc) {
2014-07-11 15:50:18 +00:00
avian::codegen::Promise* p = new (bc->zone)
avian::codegen::ListenPromise(t->m->system, bc->zone);
2008-11-23 23:58:01 +00:00
PROTECT(t, o);
object pointer = makePointer(t, p);
bc->constants = makeTriple(t, o, pointer, bc->constants);
2008-11-23 23:58:01 +00:00
return c->binaryOp(
lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::object(),
c->memory(
2014-06-01 20:22:14 +00:00
c->threadRegister(), ir::Type::object(), TARGET_THREAD_HEAPIMAGE),
c->promiseConstant(p, ir::Type::object()));
2008-11-23 23:58:01 +00:00
} else {
for (PoolElement* e = context->objectPool; e; e = e->next) {
if (o == e->target) {
2014-06-01 20:22:14 +00:00
return c->address(ir::Type::object(), e);
}
}
2014-07-11 15:50:18 +00:00
context->objectPool = new (&context->zone)
PoolElement(t, o, context->objectPool);
2008-11-23 23:58:01 +00:00
2014-07-11 15:50:18 +00:00
++context->objectPoolCount;
2014-06-01 20:22:14 +00:00
return c->address(ir::Type::object(), context->objectPool);
2008-11-23 23:58:01 +00:00
}
2007-10-10 22:39:40 +00:00
}
2014-07-11 15:50:18 +00:00
unsigned localSize()
{
return local::localSize(t, context->method);
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
unsigned stackSize()
{
2014-06-28 04:00:05 +00:00
return context->method->code()->maxStack();
}
2014-07-11 15:50:18 +00:00
unsigned frameSize()
{
2008-01-07 14:51:07 +00:00
return localSize() + stackSize();
2007-12-09 22:45:43 +00:00
}
2014-05-05 16:49:50 +00:00
void set(unsigned index, ir::Type type)
{
assertT(t, index < frameSize());
2007-10-10 22:39:40 +00:00
2014-06-01 20:22:14 +00:00
if (type == ir::Type::object()) {
2008-02-11 17:21:41 +00:00
context->eventLog.append(MarkEvent);
context->eventLog.append2(index);
} else {
context->eventLog.append(ClearEvent);
context->eventLog.append2(index);
2008-01-07 14:51:07 +00:00
}
int si = index - localSize();
if (si >= 0) {
2008-02-11 17:21:41 +00:00
stackMap[si] = type;
2008-01-07 14:51:07 +00:00
}
2007-10-10 22:39:40 +00:00
}
2014-05-05 16:49:50 +00:00
ir::Type get(unsigned index)
{
assertT(t, index < frameSize());
2008-01-07 14:51:07 +00:00
int si = index - localSize();
assertT(t, si >= 0);
2008-02-11 17:21:41 +00:00
return stackMap[si];
2007-10-10 22:39:40 +00:00
}
2014-07-11 15:50:18 +00:00
void popped(unsigned count)
{
assertT(t, sp >= count);
assertT(t, sp - count >= localSize());
while (count) {
2014-06-01 20:22:14 +00:00
set(--sp, ir::Type::i4());
2014-07-11 15:50:18 +00:00
--count;
}
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
avian::codegen::Promise* addressPromise(avian::codegen::Promise* p)
{
BootContext* bc = context->bootContext;
if (bc) {
2014-07-11 15:50:18 +00:00
bc->addresses = new (bc->zone) avian::codegen::DelayedPromise(
t->m->system, bc->zone, p, bc->addresses);
return bc->addresses;
} else {
return p;
}
}
2014-05-01 18:44:42 +00:00
ir::Value* addressOperand(avian::codegen::Promise* p)
{
2014-06-01 20:22:14 +00:00
return c->promiseConstant(p, ir::Type::iptr());
}
2014-05-01 18:44:42 +00:00
ir::Value* absoluteAddressOperand(avian::codegen::Promise* p)
{
return context->bootContext
2014-02-25 22:46:35 +00:00
? c->binaryOp(
lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
c->memory(c->threadRegister(),
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
2014-02-25 22:46:35 +00:00
TARGET_THREAD_CODEIMAGE),
c->promiseConstant(
new (&context->zone) avian::codegen::OffsetPromise(
p,
-reinterpret_cast<intptr_t>(
codeAllocator(t)->memory.begin())),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()))
2014-02-25 22:46:35 +00:00
: addressOperand(p);
}
ir::Value* machineIpValue(unsigned logicalIp)
2014-05-01 18:44:42 +00:00
{
2014-06-01 20:22:14 +00:00
return c->promiseConstant(machineIp(logicalIp), ir::Type::iptr());
2007-12-16 00:24:15 +00:00
}
unsigned duplicatedIp(unsigned bytecodeIp)
{
if (UNLIKELY(subroutine)) {
return bytecodeIp + subroutine->duplicatedBaseIp;
} else {
return bytecodeIp;
}
}
Promise* machineIp(unsigned bytecodeIp)
{
return c->machineIp(duplicatedIp(bytecodeIp));
2008-01-07 14:51:07 +00:00
}
void visitLogicalIp(unsigned bytecodeIp)
{
unsigned dupIp = duplicatedIp(bytecodeIp);
c->visitLogicalIp(dupIp);
context->eventLog.append(IpEvent);
context->eventLog.append2(bytecodeIp);
}
void startLogicalIp(unsigned bytecodeIp)
{
unsigned dupIp = duplicatedIp(bytecodeIp);
c->startLogicalIp(dupIp);
2008-04-20 05:23:08 +00:00
context->eventLog.append(IpEvent);
context->eventLog.append2(bytecodeIp);
this->ip = bytecodeIp;
}
void push(ir::Type type, ir::Value* o)
2014-05-01 18:44:42 +00:00
{
assertT(t, type == o->type);
c->push(o->type, o);
assertT(t, sp + 1 <= frameSize());
set(sp++, type);
}
2014-07-11 15:50:18 +00:00
void pushObject()
{
2014-06-01 20:22:14 +00:00
c->pushed(ir::Type::object());
assertT(t, sp + 1 <= frameSize());
2014-06-01 20:22:14 +00:00
set(sp++, ir::Type::object());
}
2007-12-16 21:30:19 +00:00
void pushLarge(ir::Type type, ir::Value* o)
2014-05-01 18:44:42 +00:00
{
assertT(t, o->type == type);
c->push(type, o);
assertT(t, sp + 2 <= frameSize());
set(sp++, type);
set(sp++, type);
}
2014-06-01 20:22:14 +00:00
void popFootprint(unsigned count)
{
popped(count);
2009-05-15 02:08:01 +00:00
c->popped(count);
}
ir::Value* pop(ir::Type type)
2014-05-01 18:44:42 +00:00
{
assertT(t, sp >= 1);
assertT(t, sp - 1 >= localSize());
assertT(t, get(sp - 1) == type);
2014-06-01 20:22:14 +00:00
set(--sp, ir::Type::i4());
return c->pop(type);
2007-12-09 22:45:43 +00:00
}
2014-05-01 18:44:42 +00:00
ir::Value* popLarge(ir::Type type)
2014-05-01 18:44:42 +00:00
{
assertT(t, sp >= 1);
assertT(t, sp - 2 >= localSize());
assertT(t, get(sp - 1) == type);
assertT(t, get(sp - 2) == type);
sp -= 2;
return c->pop(type);
2007-10-10 22:39:40 +00:00
}
void load(ir::Type type, unsigned index)
2014-05-02 15:01:57 +00:00
{
assertT(t, index < localSize());
push(type, loadLocal(context, 1, type, index));
2014-05-02 15:01:57 +00:00
}
2014-07-11 15:50:18 +00:00
void loadLarge(ir::Type type, unsigned index)
{
assertT(t, index < static_cast<unsigned>(localSize() - 1));
2014-05-05 21:49:25 +00:00
pushLarge(type, loadLocal(context, 2, type, index));
2007-12-09 22:45:43 +00:00
}
void store(ir::Type type, unsigned index)
2014-05-02 16:05:19 +00:00
{
assertT(t,
2014-07-11 15:47:57 +00:00
type == ir::Type::i4() || type == ir::Type::f4()
|| type == ir::Type::object());
storeLocal(context, 1, type, pop(type), index);
unsigned ti = translateLocalIndex(context, 1, index);
assertT(t, ti < localSize());
set(ti, type);
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void storeLarge(ir::Type type, unsigned index)
{
assertT(t, type.rawSize() == 8);
2014-05-05 21:49:25 +00:00
storeLocal(context, 2, type, popLarge(type), index);
unsigned ti = translateLocalIndex(context, 2, index);
assertT(t, ti + 1 < localSize());
2014-05-05 21:49:25 +00:00
set(ti, type);
set(ti + 1, type);
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void dup()
{
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), c->peek(1, 0));
2008-02-11 17:21:41 +00:00
assertT(t, sp + 1 <= frameSize());
assertT(t, sp - 1 >= localSize());
2014-05-05 21:49:25 +00:00
set(sp, get(sp - 1));
2014-07-11 15:50:18 +00:00
++sp;
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void dupX1()
{
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
ir::Value* s1 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
assertT(t, sp + 1 <= frameSize());
assertT(t, sp - 2 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type b2 = get(sp - 2);
ir::Type b1 = get(sp - 1);
set(sp - 1, b2);
set(sp - 2, b1);
2014-07-11 15:50:18 +00:00
set(sp, b1);
2014-05-05 21:49:25 +00:00
2014-07-11 15:50:18 +00:00
++sp;
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void dupX2()
{
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
if (get(sp - 2).rawSize() == 8) {
2014-06-01 20:22:14 +00:00
ir::Value* s1 = c->pop(ir::Type::i8());
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i8(), s1);
c->push(ir::Type::i4(), s0);
2008-02-11 17:21:41 +00:00
} else {
2014-06-01 20:22:14 +00:00
ir::Value* s1 = c->pop(ir::Type::i4());
ir::Value* s2 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s2);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
2008-02-11 17:21:41 +00:00
}
assertT(t, sp + 1 <= frameSize());
assertT(t, sp - 3 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type b3 = get(sp - 3);
ir::Type b2 = get(sp - 2);
ir::Type b1 = get(sp - 1);
set(sp - 2, b3);
set(sp - 1, b2);
set(sp - 3, b1);
2014-07-11 15:50:18 +00:00
set(sp, b1);
2014-05-05 21:49:25 +00:00
2014-07-11 15:50:18 +00:00
++sp;
2007-10-10 22:39:40 +00:00
}
2014-07-11 15:50:18 +00:00
void dup2()
{
if (get(sp - 1).rawSize() == 8) {
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i8(), c->peek(2, 0));
2008-02-11 17:21:41 +00:00
} else {
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
ir::Value* s1 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
2008-02-11 17:21:41 +00:00
}
assertT(t, sp + 2 <= frameSize());
assertT(t, sp - 2 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type b2 = get(sp - 2);
ir::Type b1 = get(sp - 1);
set(sp, b2);
set(sp + 1, b1);
sp += 2;
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void dup2X1()
{
if (get(sp - 1).rawSize() == 8) {
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i8());
ir::Value* s1 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i8(), s0);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i8(), s0);
} else {
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
ir::Value* s1 = c->pop(ir::Type::i4());
ir::Value* s2 = c->pop(ir::Type::i4());
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s2);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
2008-02-11 17:21:41 +00:00
}
2007-12-09 22:45:43 +00:00
assertT(t, sp + 2 <= frameSize());
assertT(t, sp - 3 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type b3 = get(sp - 3);
ir::Type b2 = get(sp - 2);
ir::Type b1 = get(sp - 1);
set(sp - 1, b3);
set(sp - 3, b2);
2014-07-11 15:50:18 +00:00
set(sp, b2);
2014-05-05 21:49:25 +00:00
set(sp - 2, b1);
set(sp + 1, b1);
sp += 2;
}
2014-07-11 15:50:18 +00:00
void dup2X2()
{
if (get(sp - 1).rawSize() == 8) {
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i8());
if (get(sp - 3).rawSize() == 8) {
2014-06-01 20:22:14 +00:00
ir::Value* s1 = c->pop(ir::Type::i8());
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i8(), s0);
c->push(ir::Type::i8(), s1);
c->push(ir::Type::i8(), s0);
2008-02-11 17:21:41 +00:00
} else {
2014-06-01 20:22:14 +00:00
ir::Value* s1 = c->pop(ir::Type::i4());
ir::Value* s2 = c->pop(ir::Type::i4());
2008-02-11 17:21:41 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i8(), s0);
c->push(ir::Type::i4(), s2);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i8(), s0);
2008-02-11 17:21:41 +00:00
}
} else {
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
ir::Value* s1 = c->pop(ir::Type::i4());
ir::Value* s2 = c->pop(ir::Type::i4());
ir::Value* s3 = c->pop(ir::Type::i4());
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s3);
c->push(ir::Type::i4(), s2);
c->push(ir::Type::i4(), s1);
c->push(ir::Type::i4(), s0);
2008-02-11 17:21:41 +00:00
}
2007-10-02 00:08:17 +00:00
assertT(t, sp + 2 <= frameSize());
assertT(t, sp - 4 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type b4 = get(sp - 4);
ir::Type b3 = get(sp - 3);
ir::Type b2 = get(sp - 2);
ir::Type b1 = get(sp - 1);
set(sp - 2, b4);
set(sp - 1, b3);
set(sp - 4, b2);
2014-07-11 15:50:18 +00:00
set(sp, b2);
2014-05-05 21:49:25 +00:00
set(sp - 3, b1);
set(sp + 1, b1);
sp += 2;
2007-12-09 22:45:43 +00:00
}
2007-10-02 00:08:17 +00:00
2014-07-11 15:50:18 +00:00
void swap()
{
2014-06-01 20:22:14 +00:00
ir::Value* s0 = c->pop(ir::Type::i4());
ir::Value* s1 = c->pop(ir::Type::i4());
2007-10-02 00:08:17 +00:00
2014-06-01 20:22:14 +00:00
c->push(ir::Type::i4(), s0);
c->push(ir::Type::i4(), s1);
2007-10-02 00:08:17 +00:00
assertT(t, sp - 2 >= localSize());
2014-05-05 21:49:25 +00:00
ir::Type saved = get(sp - 1);
set(sp - 1, get(sp - 2));
set(sp - 2, saved);
2007-10-02 00:08:17 +00:00
}
2014-07-11 15:47:57 +00:00
TraceElement* trace(GcMethod* target, unsigned flags)
{
2008-01-07 14:51:07 +00:00
unsigned mapSize = frameMapSizeInWords(t, context->method);
TraceElement* e = context->traceLog = new (
context->zone.allocate(sizeof(TraceElement) + (mapSize * BytesPerWord)))
TraceElement(context,
duplicatedIp(ip),
target,
flags,
context->traceLog,
mapSize);
2014-07-11 15:50:18 +00:00
++context->traceLogCount;
2008-01-07 14:51:07 +00:00
context->eventLog.append(TraceEvent);
context->eventLog.appendAddress(e);
return e;
}
void pushReturnValue(unsigned code, ir::Value* result)
2014-05-01 19:56:39 +00:00
{
switch (code) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case IntField:
2014-06-01 20:22:14 +00:00
return push(ir::Type::i4(), result);
2014-05-02 15:01:57 +00:00
case FloatField:
2014-06-01 20:22:14 +00:00
return push(ir::Type::f4(), result);
case ObjectField:
2014-06-01 20:22:14 +00:00
return push(ir::Type::object(), result);
case LongField:
2014-06-01 20:22:14 +00:00
return pushLarge(ir::Type::i8(), result);
2014-05-02 15:01:57 +00:00
case DoubleField:
2014-06-01 20:22:14 +00:00
return pushLarge(ir::Type::f8(), result);
default:
abort(t);
}
}
2014-05-01 19:56:39 +00:00
Slice<ir::Value*> peekMethodArguments(unsigned footprint)
{
ir::Value** ptr = context->argumentBuffer.items;
for (unsigned i = 0; i < footprint; i++) {
*(ptr++) = c->peek(1, footprint - i - 1);
}
return Slice<ir::Value*>(context->argumentBuffer.items, footprint);
}
void stackCall(ir::Value* methodValue,
2014-05-29 04:17:25 +00:00
GcMethod* methodObject,
unsigned flags,
TraceElement* trace)
{
2014-05-29 04:17:25 +00:00
unsigned footprint = methodObject->parameterFootprint();
unsigned returnCode = methodObject->returnCode();
ir::Value* result = c->stackCall(methodValue,
flags,
trace,
operandTypeForFieldCode(t, returnCode),
peekMethodArguments(footprint));
2014-06-01 20:22:14 +00:00
popFootprint(footprint);
if (returnCode != VoidField) {
pushReturnValue(returnCode, result);
}
2014-05-01 19:56:39 +00:00
}
2014-05-01 20:30:45 +00:00
void referenceStackCall(bool isStatic,
ir::Value* methodValue,
2014-06-29 04:57:07 +00:00
GcReference* methodReference,
2014-05-01 20:30:45 +00:00
unsigned flags,
TraceElement* trace)
{
unsigned footprint
= methodReferenceParameterFootprint(t, methodReference, isStatic);
unsigned returnCode = methodReferenceReturnCode(t, methodReference);
ir::Value* result = c->stackCall(methodValue,
flags,
trace,
operandTypeForFieldCode(t, returnCode),
peekMethodArguments(footprint));
2014-05-01 20:30:45 +00:00
2014-06-01 20:22:14 +00:00
popFootprint(footprint);
2014-05-01 20:30:45 +00:00
if (returnCode != VoidField) {
pushReturnValue(returnCode, result);
}
}
void startSubroutine(unsigned ip, unsigned returnAddress)
{
// Push a dummy value to the stack, representing the return address (which
// we don't need, since we're expanding everything statically).
// TODO: in the future, push a value that we can track through type checking
2014-06-01 20:22:14 +00:00
push(ir::Type::object(), c->constant(0, ir::Type::object()));
if (DebugInstructions) {
fprintf(stderr, "startSubroutine %u %u\n", ip, returnAddress);
}
Subroutine* subroutine = new (&context->zone)
Subroutine(context->subroutineCount++,
returnAddress,
2014-06-28 04:00:05 +00:00
context->method->code()->length(),
this->subroutine);
2014-06-28 04:00:05 +00:00
context->extendLogicalCode(context->method->code()->length());
this->subroutine = subroutine;
}
unsigned endSubroutine(unsigned returnAddressLocal UNUSED)
{
// TODO: use returnAddressLocal to decide which subroutine we're returning
// from (in case it's ever not the most recent one entered). I'm unsure of
// whether such a subroutine pattern would pass bytecode verification.
unsigned returnAddress = subroutine->returnAddress;
if (DebugInstructions) {
fprintf(stderr, "endSubroutine %u %u\n", ip, returnAddress);
}
2009-07-08 14:18:40 +00:00
subroutine = subroutine->outer;
return returnAddress;
}
Context* context;
2007-12-09 22:45:43 +00:00
MyThread* t;
avian::codegen::Compiler* c;
// Innermost subroutine we're compiling code for
Subroutine* subroutine;
2014-05-05 16:49:50 +00:00
ir::Type* stackMap;
2007-12-09 22:45:43 +00:00
unsigned ip;
unsigned sp;
2008-01-07 14:51:07 +00:00
unsigned level;
2007-12-30 22:24:48 +00:00
};
2014-07-11 15:47:57 +00:00
unsigned savedTargetIndex(MyThread* t UNUSED, GcMethod* method)
{
2014-06-28 04:00:05 +00:00
return method->code()->maxLocals();
}
2014-07-11 15:47:57 +00:00
GcCallNode* findCallNode(MyThread* t, void* address);
2014-07-11 15:47:57 +00:00
void* findExceptionHandler(Thread* t, GcMethod* method, void* ip)
{
2009-05-03 20:57:11 +00:00
if (t->exception) {
2014-06-29 04:57:07 +00:00
GcArray* table = cast<GcArray>(t, method->code()->exceptionHandlerTable());
2009-05-03 20:57:11 +00:00
if (table) {
2014-06-29 04:57:07 +00:00
GcIntArray* index = cast<GcIntArray>(t, table->body()[0]);
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
uint8_t* compiled = reinterpret_cast<uint8_t*>(methodCompiled(t, method));
2014-06-29 04:57:07 +00:00
for (unsigned i = 0; i < table->length() - 1; ++i) {
unsigned start = index->body()[i * 3];
unsigned end = index->body()[(i * 3) + 1];
2009-05-03 20:57:11 +00:00
unsigned key = difference(ip, compiled) - 1;
2009-05-03 20:57:11 +00:00
if (key >= start and key < end) {
2014-06-29 04:57:07 +00:00
GcClass* catchType = cast<GcClass>(t, table->body()[i + 1]);
if (exceptionMatch(t, catchType, t->exception)) {
2014-06-29 04:57:07 +00:00
return compiled + index->body()[(i * 3) + 2];
2009-05-03 20:57:11 +00:00
}
}
}
}
}
return 0;
}
2014-07-11 15:47:57 +00:00
void releaseLock(MyThread* t, GcMethod* method, void* stack)
2009-05-03 20:57:11 +00:00
{
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_SYNCHRONIZED) {
if (t->methodLockIsClean) {
object lock;
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_STATIC) {
lock = method->class_();
} else {
2014-07-11 15:50:18 +00:00
lock = *localObject(t,
stackForFrame(t, stack, method),
method,
savedTargetIndex(t, method));
}
2014-05-29 04:17:25 +00:00
release(t, lock);
2009-05-03 20:57:11 +00:00
} else {
// got an exception while trying to acquire the lock for a
// synchronized method -- don't try to release it, since we
// never succeeded in acquiring it.
t->methodLockIsClean = true;
2009-05-03 20:57:11 +00:00
}
}
}
2014-07-11 15:47:57 +00:00
void findUnwindTarget(MyThread* t,
void** targetIp,
void** targetFrame,
void** targetStack,
GcContinuation** targetContinuation)
2007-09-29 21:08:29 +00:00
{
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
void* ip;
void* stack;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
if (t->traceContext) {
ip = t->traceContext->ip;
stack = t->traceContext->stack;
continuation = t->traceContext->continuation;
} else {
ip = getIp(t);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
stack = t->stack;
2014-05-29 04:17:25 +00:00
continuation = t->continuation;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
2014-05-29 04:17:25 +00:00
GcMethod* target = t->trace->targetMethod;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
bool mostRecent = true;
2009-05-17 00:39:08 +00:00
*targetIp = 0;
while (*targetIp == 0) {
2014-05-29 04:17:25 +00:00
GcMethod* method = methodForIp(t, ip);
if (method) {
void* handler = findExceptionHandler(t, method, ip);
2007-12-09 22:45:43 +00:00
if (handler) {
*targetIp = handler;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
nextFrame(t, &ip, &stack, method, target, mostRecent);
void** sp = static_cast<void**>(stackForFrame(t, stack, method))
2014-07-11 15:50:18 +00:00
+ t->arch->frameReturnAddressSize();
2007-10-04 22:41:19 +00:00
2014-07-11 15:50:18 +00:00
*targetFrame = static_cast<void**>(stack)
+ t->arch->framePointerOffset();
*targetStack = sp;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
*targetContinuation = continuation;
2009-05-17 23:43:48 +00:00
sp[localOffset(t, localSize(t, method), method)] = t->exception;
2007-10-04 22:41:19 +00:00
t->exception = 0;
2007-12-09 22:45:43 +00:00
} else {
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
nextFrame(t, &ip, &stack, method, target, mostRecent);
2009-05-23 22:15:06 +00:00
if (t->exception) {
releaseLock(t, method, stack);
}
2009-05-17 00:39:08 +00:00
target = method;
2009-05-03 20:57:11 +00:00
}
} else {
expect(t, ip);
2009-05-03 20:57:11 +00:00
*targetIp = ip;
*targetFrame = 0;
2009-05-03 20:57:11 +00:00
*targetStack = static_cast<void**>(stack)
2014-07-11 15:50:18 +00:00
+ t->arch->frameReturnAddressSize();
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
*targetContinuation = continuation;
2009-05-03 20:57:11 +00:00
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
while (Continuations and *targetContinuation) {
2014-06-29 03:50:32 +00:00
GcContinuation* c = *targetContinuation;
2009-05-25 04:27:50 +00:00
2014-06-29 03:50:32 +00:00
GcMethod* method = c->method();
2009-05-17 00:39:08 +00:00
2014-07-11 15:47:57 +00:00
void* handler = findExceptionHandler(t, method, c->address());
2009-05-03 20:57:11 +00:00
if (handler) {
t->exceptionHandler = handler;
2014-05-29 04:17:25 +00:00
t->exceptionStackAdjustment
2014-07-11 15:47:57 +00:00
= (stackOffsetFromFrame(t, method)
- ((c->framePointerOffset() / BytesPerWord)
- t->arch->framePointerOffset()
+ t->arch->frameReturnAddressSize())) * BytesPerWord;
2009-05-03 20:57:11 +00:00
2014-07-11 15:50:18 +00:00
t->exceptionOffset = localOffset(t, localSize(t, method), method)
* BytesPerWord;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2009-05-03 20:57:11 +00:00
break;
2009-05-23 22:15:06 +00:00
} else if (t->exception) {
2014-07-11 15:47:57 +00:00
releaseLock(t,
method,
reinterpret_cast<uint8_t*>(c) + ContinuationBody
2014-06-29 03:50:32 +00:00
+ c->returnAddressOffset()
- t->arch->returnAddressOffset());
}
2009-05-03 20:57:11 +00:00
2014-06-29 03:50:32 +00:00
*targetContinuation = c->next();
2009-05-03 20:57:11 +00:00
}
}
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
mostRecent = false;
2009-05-03 20:57:11 +00:00
}
}
2014-07-11 15:47:57 +00:00
GcContinuation* makeCurrentContinuation(MyThread* t,
void** targetIp,
void** targetStack)
2009-05-03 20:57:11 +00:00
{
void* ip = getIp(t);
2009-05-03 20:57:11 +00:00
void* stack = t->stack;
2014-07-11 15:47:57 +00:00
GcContinuationContext* context
= t->continuation
? t->continuation->context()
: makeContinuationContext(t, 0, 0, 0, 0, t->trace->originalMethod);
2009-05-25 04:27:50 +00:00
PROTECT(t, context);
2014-05-29 04:17:25 +00:00
GcMethod* target = t->trace->targetMethod;
2009-05-03 20:57:11 +00:00
PROTECT(t, target);
2014-06-29 03:50:32 +00:00
GcContinuation* first = 0;
2009-05-03 20:57:11 +00:00
PROTECT(t, first);
2014-06-29 03:50:32 +00:00
GcContinuation* last = 0;
2009-05-03 20:57:11 +00:00
PROTECT(t, last);
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
bool mostRecent = true;
2009-05-03 20:57:11 +00:00
*targetIp = 0;
while (*targetIp == 0) {
2014-05-29 04:17:25 +00:00
GcMethod* method = methodForIp(t, ip);
2009-05-03 20:57:11 +00:00
if (method) {
PROTECT(t, method);
void** top = static_cast<void**>(stack)
2014-07-11 15:50:18 +00:00
+ t->arch->frameReturnAddressSize()
+ t->arch->frameFooterSize();
2009-05-03 20:57:11 +00:00
unsigned argumentFootprint
2014-07-11 15:47:57 +00:00
= t->arch->argumentFootprint(target->parameterFootprint());
2009-05-03 20:57:11 +00:00
unsigned alignment = t->arch->stackAlignmentInWords();
if (avian::codegen::TailCalls and argumentFootprint > alignment) {
2009-05-03 20:57:11 +00:00
top += argumentFootprint - alignment;
}
void* nextIp = ip;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
nextFrame(t, &nextIp, &stack, method, target, mostRecent);
2009-05-03 20:57:11 +00:00
void** bottom = static_cast<void**>(stack)
2014-07-11 15:50:18 +00:00
+ t->arch->frameReturnAddressSize();
2009-05-03 20:57:11 +00:00
unsigned frameSize = bottom - top;
2014-07-11 15:47:57 +00:00
unsigned totalSize
= frameSize + t->arch->frameFooterSize()
+ t->arch->argumentFootprint(method->parameterFootprint());
GcContinuation* c = makeContinuation(
t,
0,
context,
method,
ip,
(frameSize + t->arch->frameFooterSize()
+ t->arch->returnAddressOffset() - t->arch->frameReturnAddressSize())
* BytesPerWord,
(frameSize + t->arch->frameFooterSize()
+ t->arch->framePointerOffset() - t->arch->frameReturnAddressSize())
* BytesPerWord,
totalSize);
2009-05-03 20:57:11 +00:00
2014-06-29 03:50:32 +00:00
memcpy(c->body().begin(), top, totalSize * BytesPerWord);
2009-05-03 20:57:11 +00:00
if (last) {
2014-06-25 20:38:13 +00:00
last->setNext(t, c);
2009-05-03 20:57:11 +00:00
} else {
first = c;
}
2009-05-03 20:57:11 +00:00
last = c;
ip = nextIp;
2009-05-03 20:57:11 +00:00
target = method;
2007-10-12 22:06:33 +00:00
} else {
*targetIp = ip;
*targetStack = static_cast<void**>(stack)
2014-07-11 15:50:18 +00:00
+ t->arch->frameReturnAddressSize();
}
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
mostRecent = false;
}
2009-05-03 20:57:11 +00:00
expect(t, last);
2014-06-25 20:38:13 +00:00
last->setNext(t, t->continuation);
2009-05-03 20:57:11 +00:00
return first;
}
2014-07-11 15:50:18 +00:00
void NO_RETURN unwind(MyThread* t)
{
void* ip;
void* frame;
void* stack;
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
findUnwindTarget(t, &ip, &frame, &stack, &continuation);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
t->trace->targetMethod = 0;
t->trace->nativeMethod = 0;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
transition(t, ip, stack, continuation, t->trace);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
vmJump(ip, frame, stack, t, 0, 0);
}
2014-07-11 15:50:18 +00:00
class MyCheckpoint : public Thread::Checkpoint {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
public:
2014-07-11 15:50:18 +00:00
MyCheckpoint(MyThread* t) : Checkpoint(t)
{
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
2014-07-11 15:50:18 +00:00
virtual void unwind()
{
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
local::unwind(static_cast<MyThread*>(t));
}
};
2014-07-11 15:50:18 +00:00
uintptr_t defaultThunk(MyThread* t);
2008-12-02 02:38:00 +00:00
2014-07-11 15:50:18 +00:00
uintptr_t nativeThunk(MyThread* t);
2008-12-02 02:38:00 +00:00
2014-07-11 15:50:18 +00:00
uintptr_t bootNativeThunk(MyThread* t);
2014-07-11 15:50:18 +00:00
uintptr_t virtualThunk(MyThread* t, unsigned index);
2014-07-11 15:50:18 +00:00
bool unresolved(MyThread* t, uintptr_t methodAddress);
2014-07-11 15:47:57 +00:00
uintptr_t methodAddress(Thread* t, GcMethod* method)
2008-12-02 02:38:00 +00:00
{
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_NATIVE) {
return bootNativeThunk(static_cast<MyThread*>(t));
2008-12-02 02:38:00 +00:00
} else {
return methodCompiled(t, method);
}
}
2014-07-11 15:47:57 +00:00
void tryInitClass(MyThread* t, GcClass* class_)
{
initClass(t, class_);
}
2014-07-11 15:47:57 +00:00
void compile(MyThread* t,
FixedAllocator* allocator,
BootContext* bootContext,
GcMethod* method);
2014-07-11 15:47:57 +00:00
GcMethod* resolveMethod(Thread* t, GcPair* pair)
{
2014-06-29 04:57:07 +00:00
GcReference* reference = cast<GcReference>(t, pair->second());
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_ = resolveClassInObject(
t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
reference,
ReferenceClass);
2014-07-11 15:47:57 +00:00
return cast<GcMethod>(t,
findInHierarchy(t,
class_,
reference->name(),
reference->spec(),
findMethodInClass,
GcNoSuchMethodError::Type));
}
2014-07-11 15:47:57 +00:00
bool methodAbstract(Thread* t UNUSED, GcMethod* method)
{
2014-07-11 15:47:57 +00:00
return method->code() == 0 and (method->flags() & ACC_NATIVE) == 0;
}
2014-07-11 15:47:57 +00:00
int64_t prepareMethodForCall(MyThread* t, GcMethod* target)
{
if (methodAbstract(t, target)) {
2014-07-11 15:47:57 +00:00
throwNew(t,
GcAbstractMethodError::Type,
"%s.%s%s",
target->class_()->name()->body().begin(),
target->name()->body().begin(),
target->spec()->body().begin());
2014-05-29 04:17:25 +00:00
} else {
if (unresolved(t, methodAddress(t, target))) {
PROTECT(t, target);
2014-05-29 04:17:25 +00:00
compile(t, codeAllocator(t), 0, target);
}
2014-05-29 04:17:25 +00:00
if (target->flags() & ACC_NATIVE) {
t->trace->nativeMethod = target;
}
return methodAddress(t, target);
}
}
2014-07-11 15:47:57 +00:00
int64_t findInterfaceMethodFromInstance(MyThread* t,
GcMethod* method,
object instance)
{
if (instance) {
2014-07-11 15:50:18 +00:00
return prepareMethodForCall(
t, findInterfaceMethod(t, method, objectClass(t, instance)));
2007-12-30 22:24:48 +00:00
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
2007-12-30 22:24:48 +00:00
}
}
2014-07-11 15:47:57 +00:00
int64_t findInterfaceMethodFromInstanceAndReference(MyThread* t,
GcPair* pair,
object instance)
{
PROTECT(t, instance);
2014-05-29 04:17:25 +00:00
GcMethod* method = resolveMethod(t, pair);
return findInterfaceMethodFromInstance(t, method, instance);
}
2014-07-11 15:47:57 +00:00
void checkMethod(Thread* t, GcMethod* method, bool shouldBeStatic)
{
2014-05-29 04:17:25 +00:00
if (((method->flags() & ACC_STATIC) == 0) == shouldBeStatic) {
2014-07-11 15:47:57 +00:00
throwNew(t,
GcIncompatibleClassChangeError::Type,
"expected %s.%s%s to be %s",
method->class_()->name()->body().begin(),
method->name()->body().begin(),
method->spec()->body().begin(),
shouldBeStatic ? "static" : "non-static");
}
}
2014-07-11 15:47:57 +00:00
int64_t findSpecialMethodFromReference(MyThread* t, GcPair* pair)
{
PROTECT(t, pair);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, pair);
2014-06-29 04:57:07 +00:00
GcClass* class_ = cast<GcMethod>(t, pair->first())->class_();
if (isSpecialMethod(t, target, class_)) {
target = findVirtualMethod(t, target, class_->super());
}
checkMethod(t, target, false);
return prepareMethodForCall(t, target);
}
2014-07-11 15:47:57 +00:00
int64_t findStaticMethodFromReference(MyThread* t, GcPair* pair)
{
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, pair);
checkMethod(t, target, true);
return prepareMethodForCall(t, target);
}
2014-07-11 15:47:57 +00:00
int64_t findVirtualMethodFromReference(MyThread* t,
GcPair* pair,
object instance)
{
PROTECT(t, instance);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, pair);
target = findVirtualMethod(t, target, objectClass(t, instance));
checkMethod(t, target, false);
return prepareMethodForCall(t, target);
}
2014-07-11 15:47:57 +00:00
int64_t getMethodAddress(MyThread* t, GcMethod* target)
{
return prepareMethodForCall(t, target);
}
2014-07-11 15:47:57 +00:00
int64_t getJClassFromReference(MyThread* t, GcPair* pair)
{
2014-05-29 04:17:25 +00:00
return reinterpret_cast<intptr_t>(getJClass(
t,
resolveClass(t,
2014-07-11 15:47:57 +00:00
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name())));
}
2014-07-11 15:50:18 +00:00
unsigned traceSize(Thread* t)
{
2014-07-11 15:50:18 +00:00
class Counter : public Processor::StackVisitor {
public:
2014-07-11 15:50:18 +00:00
Counter() : count(0)
{
}
2014-07-11 15:50:18 +00:00
virtual bool visit(Processor::StackWalker*)
{
++count;
return true;
}
unsigned count;
} counter;
t->m->processor->walkStack(t, &counter);
2014-07-11 15:47:57 +00:00
return pad(GcArray::FixedSize)
+ (counter.count * pad(ArrayElementSizeOfArray))
+ (counter.count * pad(GcTraceElement::FixedSize));
}
2014-07-11 15:50:18 +00:00
void NO_RETURN throwArithmetic(MyThread* t)
{
2014-05-29 04:17:25 +00:00
if (ensure(t, GcArithmeticException::FixedSize + traceSize(t))) {
t->setFlag(Thread::TracingFlag);
THREAD_RESOURCE0(t, t->clearFlag(Thread::TracingFlag));
2014-05-29 04:17:25 +00:00
throwNew(t, GcArithmeticException::Type);
} else {
// not enough memory available for a new exception and stack trace
// -- use a preallocated instance instead
2014-06-30 01:44:41 +00:00
throw_(t, roots(t)->arithmeticException());
}
}
int64_t divideLong(MyThread* t, int64_t b, int64_t a)
{
if (LIKELY(b)) {
return a / b;
} else {
throwArithmetic(t);
}
}
int64_t divideInt(MyThread* t, int32_t b, int32_t a)
2009-10-29 16:12:30 +00:00
{
if (LIKELY(b)) {
return a / b;
} else {
throwArithmetic(t);
}
2009-10-29 16:12:30 +00:00
}
int64_t moduloLong(MyThread* t, int64_t b, int64_t a)
{
if (LIKELY(b)) {
return a % b;
} else {
throwArithmetic(t);
}
}
int64_t moduloInt(MyThread* t, int32_t b, int32_t a)
{
if (LIKELY(b)) {
return a % b;
} else {
throwArithmetic(t);
}
2009-10-29 20:14:44 +00:00
}
2014-07-11 15:47:57 +00:00
uint64_t makeBlankObjectArray(MyThread* t, GcClass* class_, int32_t length)
2007-09-30 02:48:27 +00:00
{
if (length >= 0) {
return reinterpret_cast<uint64_t>(makeObjectArray(t, class_, length));
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNegativeArraySizeException::Type, "%d", length);
}
2007-09-30 02:48:27 +00:00
}
2014-07-11 15:47:57 +00:00
uint64_t makeBlankObjectArrayFromReference(MyThread* t,
GcPair* pair,
int32_t length)
{
2014-05-29 04:17:25 +00:00
return makeBlankObjectArray(
t,
resolveClass(t,
2014-07-11 15:47:57 +00:00
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name()),
2014-05-29 04:17:25 +00:00
length);
}
2014-07-11 15:50:18 +00:00
uint64_t makeBlankArray(MyThread* t, unsigned type, int32_t length)
2007-09-30 02:48:27 +00:00
{
if (length >= 0) {
2008-11-30 01:39:42 +00:00
switch (type) {
case T_BOOLEAN:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeBooleanArray(t, length));
2008-11-30 01:39:42 +00:00
case T_CHAR:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeCharArray(t, length));
2008-11-30 01:39:42 +00:00
case T_FLOAT:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeFloatArray(t, length));
2008-11-30 01:39:42 +00:00
case T_DOUBLE:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeDoubleArray(t, length));
2008-11-30 01:39:42 +00:00
case T_BYTE:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeByteArray(t, length));
2008-11-30 01:39:42 +00:00
case T_SHORT:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeShortArray(t, length));
2008-11-30 01:39:42 +00:00
case T_INT:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeIntArray(t, length));
2008-11-30 01:39:42 +00:00
case T_LONG:
2014-05-29 04:17:25 +00:00
return reinterpret_cast<uintptr_t>(makeLongArray(t, length));
2014-07-11 15:50:18 +00:00
default:
abort(t);
2008-11-30 01:39:42 +00:00
}
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNegativeArraySizeException::Type, "%d", length);
}
2007-09-30 02:48:27 +00:00
}
2014-07-11 15:50:18 +00:00
uint64_t lookUpAddress(int32_t key,
uintptr_t* start,
int32_t count,
uintptr_t default_)
{
2007-12-09 22:45:43 +00:00
int32_t bottom = 0;
int32_t top = count;
for (int32_t span = top - bottom; span; span = top - bottom) {
int32_t middle = bottom + (span / 2);
uintptr_t* p = start + (middle * 2);
int32_t k = *p;
if (key < k) {
top = middle;
} else if (key > k) {
bottom = middle + 1;
} else {
return p[1];
}
}
return default_;
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void setMaybeNull(MyThread* t, object o, unsigned offset, object value)
2007-12-09 22:45:43 +00:00
{
if (LIKELY(o)) {
2014-06-26 02:17:27 +00:00
setField(t, o, offset, value);
2007-12-30 22:24:48 +00:00
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
2007-12-30 22:24:48 +00:00
}
}
2014-07-11 15:50:18 +00:00
void acquireMonitorForObject(MyThread* t, object o)
2007-12-30 22:24:48 +00:00
{
if (LIKELY(o)) {
2007-12-30 22:24:48 +00:00
acquire(t, o);
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
2007-12-30 22:24:48 +00:00
}
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:50:18 +00:00
void acquireMonitorForObjectOnEntrance(MyThread* t, object o)
{
if (LIKELY(o)) {
t->methodLockIsClean = false;
acquire(t, o);
t->methodLockIsClean = true;
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
}
}
2014-07-11 15:50:18 +00:00
void releaseMonitorForObject(MyThread* t, object o)
2007-12-09 22:45:43 +00:00
{
if (LIKELY(o)) {
2007-12-30 22:24:48 +00:00
release(t, o);
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
2007-12-30 22:24:48 +00:00
}
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:47:57 +00:00
object makeMultidimensionalArray2(MyThread* t,
GcClass* class_,
uintptr_t* countStack,
int32_t dimensions)
2007-12-09 22:45:43 +00:00
{
PROTECT(t, class_);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, int32_t, counts, dimensions);
2007-12-09 22:45:43 +00:00
for (int i = dimensions - 1; i >= 0; --i) {
RUNTIME_ARRAY_BODY(counts)[i] = countStack[dimensions - i - 1];
if (UNLIKELY(RUNTIME_ARRAY_BODY(counts)[i] < 0)) {
2014-07-11 15:47:57 +00:00
throwNew(t,
GcNegativeArraySizeException::Type,
"%d",
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
RUNTIME_ARRAY_BODY(counts)[i]);
2007-12-09 22:45:43 +00:00
return 0;
}
}
object array = makeArray(t, RUNTIME_ARRAY_BODY(counts)[0]);
2007-12-09 22:45:43 +00:00
setObjectClass(t, array, class_);
PROTECT(t, array);
populateMultiArray(t, array, RUNTIME_ARRAY_BODY(counts), 0, dimensions);
2007-12-09 22:45:43 +00:00
return array;
}
2014-07-11 15:47:57 +00:00
uint64_t makeMultidimensionalArray(MyThread* t,
GcClass* class_,
int32_t dimensions,
int32_t offset)
{
2014-07-11 15:50:18 +00:00
return reinterpret_cast<uintptr_t>(makeMultidimensionalArray2(
t, class_, static_cast<uintptr_t*>(t->stack) + offset, dimensions));
}
2014-07-11 15:47:57 +00:00
uint64_t makeMultidimensionalArrayFromReference(MyThread* t,
GcPair* pair,
int32_t dimensions,
int32_t offset)
{
2014-07-11 15:47:57 +00:00
return makeMultidimensionalArray(
t,
resolveClass(t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name()),
dimensions,
offset);
}
2014-07-11 15:50:18 +00:00
void NO_RETURN throwArrayIndexOutOfBounds(MyThread* t)
{
2014-05-29 04:17:25 +00:00
if (ensure(t, GcArrayIndexOutOfBoundsException::FixedSize + traceSize(t))) {
t->setFlag(Thread::TracingFlag);
THREAD_RESOURCE0(t, t->clearFlag(Thread::TracingFlag));
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
2014-05-29 04:17:25 +00:00
throwNew(t, GcArrayIndexOutOfBoundsException::Type);
} else {
// not enough memory available for a new exception and stack trace
// -- use a preallocated instance instead
2014-06-30 01:44:41 +00:00
throw_(t, roots(t)->arrayIndexOutOfBoundsException());
}
}
2014-07-11 15:50:18 +00:00
void NO_RETURN throwStackOverflow(MyThread* t)
{
2014-05-29 04:17:25 +00:00
throwNew(t, GcStackOverflowError::Type);
}
2014-07-11 15:47:57 +00:00
void NO_RETURN throw_(MyThread* t, GcThrowable* o)
2007-10-09 17:15:40 +00:00
{
if (LIKELY(o)) {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
vm::throw_(t, o);
2007-12-09 22:45:43 +00:00
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcNullPointerException::Type);
}
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:47:57 +00:00
void checkCast(MyThread* t, GcClass* class_, object o)
{
if (UNLIKELY(o and not isAssignableFrom(t, class_, objectClass(t, o)))) {
2014-06-29 04:57:07 +00:00
GcByteArray* classNameFrom = objectClass(t, o)->name();
2014-07-11 15:47:57 +00:00
GcByteArray* classNameTo = class_->name();
2014-06-29 04:57:07 +00:00
THREAD_RUNTIME_ARRAY(t, char, classFrom, classNameFrom->length());
2014-07-11 15:47:57 +00:00
THREAD_RUNTIME_ARRAY(t, char, classTo, classNameTo->length());
replace('/',
'.',
RUNTIME_ARRAY_BODY(classFrom),
2014-06-29 04:57:07 +00:00
reinterpret_cast<char*>(classNameFrom->body().begin()));
2014-07-11 15:47:57 +00:00
replace('/',
'.',
RUNTIME_ARRAY_BODY(classTo),
2014-06-28 23:24:24 +00:00
reinterpret_cast<char*>(classNameTo->body().begin()));
2014-07-11 15:47:57 +00:00
throwNew(t,
GcClassCastException::Type,
"%s cannot be cast to %s",
RUNTIME_ARRAY_BODY(classFrom),
RUNTIME_ARRAY_BODY(classTo));
}
}
2014-07-11 15:47:57 +00:00
void checkCastFromReference(MyThread* t, GcPair* pair, object o)
{
PROTECT(t, o);
2014-07-11 15:47:57 +00:00
GcClass* c
= resolveClass(t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name());
checkCast(t, c, o);
}
2014-07-11 15:47:57 +00:00
GcField* resolveField(Thread* t, GcPair* pair)
{
2014-06-29 04:57:07 +00:00
GcReference* reference = cast<GcReference>(t, pair->second());
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_ = resolveClassInObject(
t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
reference,
ReferenceClass);
2014-07-11 15:47:57 +00:00
return cast<GcField>(t,
findInHierarchy(t,
class_,
reference->name(),
reference->spec(),
findFieldInClass,
GcNoSuchFieldError::Type));
}
2014-07-11 15:47:57 +00:00
uint64_t getFieldValue(Thread* t, object target, GcField* field)
{
2014-06-29 04:57:07 +00:00
switch (field->code()) {
case ByteField:
case BooleanField:
2014-06-29 04:57:07 +00:00
return fieldAtOffset<int8_t>(target, field->offset());
case CharField:
case ShortField:
2014-06-29 04:57:07 +00:00
return fieldAtOffset<int16_t>(target, field->offset());
case FloatField:
case IntField:
2014-06-29 04:57:07 +00:00
return fieldAtOffset<int32_t>(target, field->offset());
case DoubleField:
case LongField:
2014-06-29 04:57:07 +00:00
return fieldAtOffset<int64_t>(target, field->offset());
case ObjectField:
2014-06-29 04:57:07 +00:00
return fieldAtOffset<intptr_t>(target, field->offset());
default:
abort(t);
}
}
2014-07-11 15:47:57 +00:00
uint64_t getStaticFieldValueFromReference(MyThread* t, GcPair* pair)
{
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
initClass(t, field->class_());
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_READ(t, field);
return getFieldValue(t, field->class_()->staticTable(), field);
}
2014-07-11 15:47:57 +00:00
uint64_t getFieldValueFromReference(MyThread* t, GcPair* pair, object instance)
{
PROTECT(t, instance);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_READ(t, field);
return getFieldValue(t, instance, field);
}
2014-07-11 15:47:57 +00:00
void setStaticLongFieldValueFromReference(MyThread* t,
GcPair* pair,
uint64_t value)
{
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
initClass(t, field->class_());
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
2014-07-11 15:47:57 +00:00
fieldAtOffset<int64_t>(field->class_()->staticTable(), field->offset())
= value;
}
2014-07-11 15:47:57 +00:00
void setLongFieldValueFromReference(MyThread* t,
GcPair* pair,
object instance,
uint64_t value)
{
PROTECT(t, instance);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
2014-06-29 04:57:07 +00:00
fieldAtOffset<int64_t>(instance, field->offset()) = value;
}
2014-07-11 15:47:57 +00:00
void setStaticObjectFieldValueFromReference(MyThread* t,
GcPair* pair,
object value)
{
PROTECT(t, value);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
initClass(t, field->class_());
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
2014-07-11 15:47:57 +00:00
setField(t, field->class_()->staticTable(), field->offset(), value);
}
2014-07-11 15:47:57 +00:00
void setObjectFieldValueFromReference(MyThread* t,
GcPair* pair,
object instance,
object value)
{
PROTECT(t, instance);
PROTECT(t, value);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
2014-06-26 02:17:27 +00:00
setField(t, instance, field->offset(), value);
}
2014-07-11 15:47:57 +00:00
void setFieldValue(MyThread* t, object target, GcField* field, uint32_t value)
{
2014-06-29 04:57:07 +00:00
switch (field->code()) {
case ByteField:
case BooleanField:
2014-06-29 04:57:07 +00:00
fieldAtOffset<int8_t>(target, field->offset()) = value;
break;
case CharField:
case ShortField:
2014-06-29 04:57:07 +00:00
fieldAtOffset<int16_t>(target, field->offset()) = value;
break;
case FloatField:
case IntField:
2014-06-29 04:57:07 +00:00
fieldAtOffset<int32_t>(target, field->offset()) = value;
break;
default:
abort(t);
}
}
2014-07-11 15:47:57 +00:00
void setStaticFieldValueFromReference(MyThread* t, GcPair* pair, uint32_t value)
{
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
initClass(t, field->class_());
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
setFieldValue(t, field->class_()->staticTable(), field, value);
}
2014-07-11 15:47:57 +00:00
void setFieldValueFromReference(MyThread* t,
GcPair* pair,
object instance,
uint32_t value)
{
PROTECT(t, instance);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, pair);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
ACQUIRE_FIELD_FOR_WRITE(t, field);
setFieldValue(t, instance, field, value);
}
2014-07-11 15:47:57 +00:00
uint64_t instanceOf64(Thread* t, GcClass* class_, object o)
{
return instanceOf(t, class_, o);
}
2014-07-11 15:47:57 +00:00
uint64_t instanceOfFromReference(Thread* t, GcPair* pair, object o)
{
PROTECT(t, o);
2014-07-11 15:47:57 +00:00
GcClass* c
= resolveClass(t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name());
return instanceOf64(t, c, o);
}
2014-07-11 15:47:57 +00:00
uint64_t makeNewGeneral64(Thread* t, GcClass* class_)
{
PROTECT(t, class_);
initClass(t, class_);
return reinterpret_cast<uintptr_t>(makeNewGeneral(t, class_));
}
2014-07-11 15:47:57 +00:00
uint64_t makeNew64(Thread* t, GcClass* class_)
{
PROTECT(t, class_);
initClass(t, class_);
return reinterpret_cast<uintptr_t>(makeNew(t, class_));
}
2014-07-11 15:47:57 +00:00
uint64_t makeNewFromReference(Thread* t, GcPair* pair)
{
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClass(t,
cast<GcMethod>(t, pair->first())->class_()->loader(),
cast<GcReference>(t, pair->second())->name());
PROTECT(t, class_);
initClass(t, class_);
return makeNewGeneral64(t, class_);
}
2014-07-11 15:47:57 +00:00
uint64_t getJClass64(Thread* t, GcClass* class_)
2010-12-03 20:42:13 +00:00
{
return reinterpret_cast<uintptr_t>(getJClass(t, class_));
}
2014-07-11 15:50:18 +00:00
void gcIfNecessary(MyThread* t)
2008-04-09 19:08:13 +00:00
{
stress(t);
if (UNLIKELY(t->getFlags() & Thread::UseBackupHeapFlag)) {
2008-04-09 19:08:13 +00:00
collect(t, Heap::MinorCollection);
}
}
void idleIfNecessary(MyThread* t)
{
if (UNLIKELY(t->m->exclusive)) {
ENTER(t, Thread::IdleState);
}
}
bool useLongJump(MyThread* t, uintptr_t target)
{
uintptr_t reach = t->arch->maximumImmediateJump();
FixedAllocator* a = codeAllocator(t);
uintptr_t start = reinterpret_cast<uintptr_t>(a->memory.begin());
uintptr_t end = reinterpret_cast<uintptr_t>(a->memory.begin())
+ a->memory.count;
assertT(t, end - start < reach);
return (target > end && (target - start) > reach)
or (target < start && (end - target) > reach);
}
FILE* compileLog = 0;
void logCompile(MyThread* t,
const void* code,
unsigned size,
const char* class_,
const char* name,
const char* spec);
unsigned simpleFrameMapTableSize(MyThread* t, GcMethod* method, GcIntArray* map)
{
int size = frameMapSizeInBits(t, method);
return ceilingDivide(map->length() * size, 32 + size);
}
#ifndef AVIAN_AOT_ONLY
2014-07-11 15:50:18 +00:00
unsigned resultSize(MyThread* t, unsigned code)
2007-12-09 22:45:43 +00:00
{
switch (code) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case FloatField:
2008-02-11 17:21:41 +00:00
case IntField:
return 4;
case ObjectField:
return TargetBytesPerWord;
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
case LongField:
2008-02-11 17:21:41 +00:00
case DoubleField:
return 8;
2007-12-09 22:45:43 +00:00
case VoidField:
2008-02-11 17:21:41 +00:00
return 0;
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
default:
abort(t);
}
2007-12-09 22:45:43 +00:00
}
2014-05-01 18:44:42 +00:00
ir::Value* popField(MyThread* t, Frame* frame, int code)
{
switch (code) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case IntField:
2014-06-01 20:22:14 +00:00
return frame->pop(ir::Type::i4());
case FloatField:
2014-06-01 20:22:14 +00:00
return frame->pop(ir::Type::f4());
case LongField:
2014-06-01 20:22:14 +00:00
return frame->popLarge(ir::Type::i8());
case DoubleField:
2014-06-01 20:22:14 +00:00
return frame->popLarge(ir::Type::f8());
case ObjectField:
2014-06-01 20:22:14 +00:00
return frame->pop(ir::Type::object());
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
}
2014-07-11 15:50:18 +00:00
void compileSafePoint(MyThread* t, Compiler* c, Frame* frame)
{
2014-07-17 00:07:56 +00:00
c->nativeCall(
c->constant(getThunk(t, idleIfNecessaryThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister()));
}
void compileDirectInvoke(MyThread* t,
Frame* frame,
2014-05-29 04:17:25 +00:00
GcMethod* target,
bool tailCall,
bool useThunk,
avian::codegen::Promise* addressPromise)
{
avian::codegen::Compiler* c = frame->c;
2014-07-11 15:50:18 +00:00
unsigned flags
= (avian::codegen::TailCalls and tailCall ? Compiler::TailJump : 0);
unsigned traceFlags;
if (addressPromise == 0 and useLongJump(t, methodAddress(t, target))) {
flags |= Compiler::LongJumpOrCall;
traceFlags = TraceElement::LongCall;
} else {
traceFlags = 0;
}
2014-07-11 15:47:57 +00:00
if (useThunk or (avian::codegen::TailCalls and tailCall
and (target->flags() & ACC_NATIVE))) {
if (frame->context->bootContext == 0) {
flags |= Compiler::Aligned;
}
if (avian::codegen::TailCalls and tailCall) {
traceFlags |= TraceElement::TailCall;
TraceElement* trace = frame->trace(target, traceFlags);
2014-07-11 15:50:18 +00:00
avian::codegen::Promise* returnAddressPromise
= new (frame->context->zone.allocate(sizeof(TraceElementPromise)))
TraceElementPromise(t->m->system, trace);
2014-06-01 20:22:14 +00:00
frame->stackCall(
c->promiseConstant(returnAddressPromise, ir::Type::iptr()),
target,
flags,
trace);
2014-06-01 20:22:14 +00:00
c->store(frame->absoluteAddressOperand(returnAddressPromise),
c->memory(c->threadRegister(),
ir::Type::iptr(),
TARGET_THREAD_TAILADDRESS));
2014-07-11 15:47:57 +00:00
c->exit(c->constant(
(target->flags() & ACC_NATIVE) ? nativeThunk(t) : defaultThunk(t),
ir::Type::iptr()));
} else {
2014-06-01 20:22:14 +00:00
return frame->stackCall(c->constant(defaultThunk(t), ir::Type::iptr()),
2014-05-01 19:56:39 +00:00
target,
flags,
frame->trace(target, traceFlags));
}
} else {
2014-05-01 18:44:42 +00:00
ir::Value* address
= (addressPromise
2014-06-01 20:22:14 +00:00
? c->promiseConstant(addressPromise, ir::Type::iptr())
: c->constant(methodAddress(t, target), ir::Type::iptr()));
frame->stackCall(
2014-05-01 19:56:39 +00:00
address,
target,
flags,
2014-07-11 15:47:57 +00:00
tailCall ? 0 : frame->trace((target->flags() & ACC_NATIVE) ? target : 0,
0));
}
}
2014-07-11 15:47:57 +00:00
bool compileDirectInvoke(MyThread* t,
Frame* frame,
GcMethod* target,
bool tailCall)
2007-12-09 22:45:43 +00:00
{
// don't bother calling an empty method unless calling it might
// cause the class to be initialized, which may have side effects
2014-07-11 15:47:57 +00:00
if (emptyMethod(t, target) and (not classNeedsInit(t, target->class_()))) {
2014-05-29 04:17:25 +00:00
frame->popFootprint(target->parameterFootprint());
2009-04-22 01:39:25 +00:00
tailCall = false;
} else {
BootContext* bc = frame->context->bootContext;
if (bc) {
2014-05-29 04:17:25 +00:00
if ((target->class_() == frame->context->method->class_()
or (not classNeedsInit(t, target->class_())))
2014-07-11 15:47:57 +00:00
and (not(avian::codegen::TailCalls and tailCall
and (target->flags() & ACC_NATIVE)))) {
2014-07-11 15:50:18 +00:00
avian::codegen::Promise* p = new (bc->zone)
avian::codegen::ListenPromise(t->m->system, bc->zone);
PROTECT(t, target);
object pointer = makePointer(t, p);
bc->calls = makeTriple(t, target, pointer, bc->calls);
compileDirectInvoke(t, frame, target, tailCall, false, p);
} else {
compileDirectInvoke(t, frame, target, tailCall, true, 0);
}
} else if (unresolved(t, methodAddress(t, target))
2014-07-11 15:47:57 +00:00
or classNeedsInit(t, target->class_())) {
compileDirectInvoke(t, frame, target, tailCall, true, 0);
} else {
compileDirectInvoke(t, frame, target, tailCall, false, 0);
}
2008-04-09 19:08:13 +00:00
}
2007-09-25 23:53:11 +00:00
2009-04-22 01:39:25 +00:00
return tailCall;
2007-12-09 22:45:43 +00:00
}
2014-05-01 20:30:45 +00:00
void compileReferenceInvoke(Frame* frame,
2014-05-01 18:44:42 +00:00
ir::Value* method,
2014-06-29 04:57:07 +00:00
GcReference* reference,
2014-05-01 18:44:42 +00:00
bool isStatic,
bool tailCall)
{
2014-05-01 20:30:45 +00:00
frame->referenceStackCall(isStatic,
method,
reference,
2014-05-01 18:44:42 +00:00
tailCall ? Compiler::TailJump : 0,
2014-05-01 20:30:45 +00:00
frame->trace(0, 0));
}
2014-07-11 15:47:57 +00:00
void compileDirectReferenceInvoke(MyThread* t,
Frame* frame,
Thunk thunk,
GcReference* reference,
bool isStatic,
bool tailCall)
{
avian::codegen::Compiler* c = frame->c;
PROTECT(t, reference);
GcPair* pair = makePair(t, frame->context->method, reference);
2014-06-01 20:22:14 +00:00
compileReferenceInvoke(
frame,
c->nativeCall(c->constant(getThunk(t, thunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::iptr(),
args(c->threadRegister(), frame->append(pair))),
2014-06-01 20:22:14 +00:00
reference,
isStatic,
tailCall);
}
void compileAbstractInvoke(Frame* frame,
2014-05-01 18:44:42 +00:00
ir::Value* method,
2014-05-29 04:17:25 +00:00
GcMethod* target,
2014-05-01 18:44:42 +00:00
bool tailCall)
{
frame->stackCall(
2014-05-01 19:56:39 +00:00
method, target, tailCall ? Compiler::TailJump : 0, frame->trace(0, 0));
}
2014-07-11 15:47:57 +00:00
void compileDirectAbstractInvoke(MyThread* t,
Frame* frame,
Thunk thunk,
GcMethod* target,
bool tailCall)
{
avian::codegen::Compiler* c = frame->c;
2014-07-11 15:47:57 +00:00
compileAbstractInvoke(
frame,
c->nativeCall(c->constant(getThunk(t, thunk), ir::Type::iptr()),
2014-07-17 00:07:56 +00:00
0,
frame->trace(0, 0),
ir::Type::iptr(),
args(c->threadRegister(), frame->append(target))),
2014-07-11 15:47:57 +00:00
target,
tailCall);
}
2014-07-11 15:50:18 +00:00
void handleMonitorEvent(MyThread* t, Frame* frame, intptr_t function)
{
avian::codegen::Compiler* c = frame->c;
2014-05-29 04:17:25 +00:00
GcMethod* method = frame->context->method;
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_SYNCHRONIZED) {
2014-05-01 18:44:42 +00:00
ir::Value* lock;
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_STATIC) {
PROTECT(t, method);
2014-06-29 04:57:07 +00:00
lock = frame->append(method->class_());
} else {
2014-05-01 13:18:12 +00:00
lock = loadLocal(
2014-06-01 20:22:14 +00:00
frame->context, 1, ir::Type::object(), savedTargetIndex(t, method));
}
c->nativeCall(c->constant(function, ir::Type::iptr()),
2014-07-17 00:07:56 +00:00
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), lock));
}
}
2014-07-11 15:50:18 +00:00
void handleEntrance(MyThread* t, Frame* frame)
{
2014-05-29 04:17:25 +00:00
GcMethod* method = frame->context->method;
2014-07-11 15:47:57 +00:00
if ((method->flags() & (ACC_SYNCHRONIZED | ACC_STATIC)) == ACC_SYNCHRONIZED) {
// save 'this' pointer in case it is overwritten.
unsigned index = savedTargetIndex(t, method);
2014-05-01 13:18:12 +00:00
storeLocal(frame->context,
1,
2014-06-01 20:22:14 +00:00
ir::Type::object(),
loadLocal(frame->context, 1, ir::Type::object(), 0),
2014-05-01 13:18:12 +00:00
index);
2014-06-01 20:22:14 +00:00
frame->set(index, ir::Type::object());
}
2014-07-11 15:50:18 +00:00
handleMonitorEvent(
t, frame, getThunk(t, acquireMonitorForObjectOnEntranceThunk));
}
2014-07-11 15:50:18 +00:00
void handleExit(MyThread* t, Frame* frame)
{
2014-07-11 15:50:18 +00:00
handleMonitorEvent(t, frame, getThunk(t, releaseMonitorForObjectThunk));
}
2014-07-11 15:47:57 +00:00
bool inTryBlock(MyThread* t UNUSED, GcCode* code, unsigned ip)
{
2014-07-11 15:47:57 +00:00
GcExceptionHandlerTable* table
= cast<GcExceptionHandlerTable>(t, code->exceptionHandlerTable());
if (table) {
2014-06-29 04:57:07 +00:00
unsigned length = table->length();
for (unsigned i = 0; i < length; ++i) {
2014-06-29 04:57:07 +00:00
uint64_t eh = table->body()[i];
2014-07-11 15:50:18 +00:00
if (ip >= exceptionHandlerStart(eh) and ip < exceptionHandlerEnd(eh)) {
return true;
}
}
}
return false;
}
2014-07-11 15:47:57 +00:00
bool needsReturnBarrier(MyThread* t UNUSED, GcMethod* method)
{
2014-05-29 04:17:25 +00:00
return (method->flags() & ConstructorFlag)
2014-07-11 15:47:57 +00:00
and (method->class_()->vmFlags() & HasFinalMemberFlag);
}
2014-07-11 15:47:57 +00:00
bool returnsNext(MyThread* t, GcCode* code, unsigned ip)
{
2014-06-29 04:57:07 +00:00
switch (code->body()[ip]) {
case return_:
case areturn:
case ireturn:
case freturn:
case lreturn:
case dreturn:
return true;
case goto_: {
uint32_t offset = codeReadInt16(t, code, ++ip);
uint32_t newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
return returnsNext(t, code, newIp);
}
case goto_w: {
uint32_t offset = codeReadInt32(t, code, ++ip);
uint32_t newIp = (ip - 5) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-05-29 04:17:25 +00:00
return returnsNext(t, code, newIp);
}
default:
return false;
}
}
2014-07-11 15:47:57 +00:00
bool isTailCall(MyThread* t,
GcCode* code,
unsigned ip,
GcMethod* caller,
int calleeReturnCode,
GcByteArray* calleeClassName,
GcByteArray* calleeMethodName,
GcByteArray* calleeMethodSpec)
{
return avian::codegen::TailCalls
2014-07-11 15:47:57 +00:00
and ((caller->flags() & ACC_SYNCHRONIZED) == 0)
and (not inTryBlock(t, code, ip - 1))
and (not needsReturnBarrier(t, caller))
and (caller->returnCode() == VoidField
or caller->returnCode() == calleeReturnCode)
and returnsNext(t, code, ip)
and t->m->classpath->canTailCall(t,
caller,
calleeClassName,
calleeMethodName,
calleeMethodSpec);
}
bool isTailCall(MyThread* t,
GcCode* code,
unsigned ip,
GcMethod* caller,
GcMethod* callee)
{
return isTailCall(t,
code,
ip,
caller,
callee->returnCode(),
callee->class_()->name(),
callee->name(),
callee->spec());
}
bool isReferenceTailCall(MyThread* t,
GcCode* code,
unsigned ip,
GcMethod* caller,
GcReference* calleeReference)
{
return isTailCall(t,
code,
ip,
caller,
methodReferenceReturnCode(t, calleeReference),
calleeReference->class_(),
calleeReference->name(),
calleeReference->spec());
}
2014-07-11 15:50:18 +00:00
lir::TernaryOperation toCompilerJumpOp(MyThread* t, unsigned instruction)
{
switch (instruction) {
case ifeq:
case if_icmpeq:
case if_acmpeq:
case ifnull:
return lir::JumpIfEqual;
case ifne:
case if_icmpne:
case if_acmpne:
case ifnonnull:
return lir::JumpIfNotEqual;
case ifgt:
case if_icmpgt:
return lir::JumpIfGreater;
case ifge:
case if_icmpge:
return lir::JumpIfGreaterOrEqual;
case iflt:
case if_icmplt:
return lir::JumpIfLess;
case ifle:
case if_icmple:
return lir::JumpIfLessOrEqual;
default:
abort(t);
}
}
2014-05-01 18:14:27 +00:00
bool integerBranch(MyThread* t,
Frame* frame,
2014-06-29 04:57:07 +00:00
GcCode* code,
2014-05-01 18:14:27 +00:00
unsigned& ip,
2014-05-01 18:44:42 +00:00
ir::Value* a,
ir::Value* b,
2014-05-01 18:14:27 +00:00
unsigned* newIpp)
2009-10-07 00:50:32 +00:00
{
2014-06-29 04:57:07 +00:00
if (ip + 3 > code->length()) {
2009-10-07 00:50:32 +00:00
return false;
}
avian::codegen::Compiler* c = frame->c;
2014-06-29 04:57:07 +00:00
unsigned instruction = code->body()[ip++];
2009-10-07 00:50:32 +00:00
uint32_t offset = codeReadInt16(t, code, ip);
uint32_t newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-05-01 18:44:42 +00:00
ir::Value* target = frame->machineIpValue(newIp);
2009-10-07 00:50:32 +00:00
switch (instruction) {
case ifeq:
case ifne:
case ifgt:
case ifge:
case iflt:
case ifle:
c->condJump(toCompilerJumpOp(t, instruction), a, b, target);
break;
2009-10-07 00:50:32 +00:00
default:
ip -= 3;
return false;
}
*newIpp = newIp;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return true;
2009-10-07 00:50:32 +00:00
}
lir::TernaryOperation toCompilerFloatJumpOp(MyThread* t,
unsigned instruction,
bool lessIfUnordered)
{
2014-07-11 15:50:18 +00:00
switch (instruction) {
case ifeq:
return lir::JumpIfFloatEqual;
case ifne:
return lir::JumpIfFloatNotEqual;
case ifgt:
if (lessIfUnordered) {
return lir::JumpIfFloatGreater;
} else {
return lir::JumpIfFloatGreaterOrUnordered;
}
case ifge:
if (lessIfUnordered) {
return lir::JumpIfFloatGreaterOrEqual;
} else {
return lir::JumpIfFloatGreaterOrEqualOrUnordered;
}
case iflt:
if (lessIfUnordered) {
return lir::JumpIfFloatLessOrUnordered;
} else {
return lir::JumpIfFloatLess;
}
case ifle:
if (lessIfUnordered) {
return lir::JumpIfFloatLessOrEqualOrUnordered;
} else {
return lir::JumpIfFloatLessOrEqual;
}
default:
abort(t);
}
}
2014-05-01 18:14:27 +00:00
bool floatBranch(MyThread* t,
Frame* frame,
2014-06-29 04:57:07 +00:00
GcCode* code,
2014-05-01 18:14:27 +00:00
unsigned& ip,
bool lessIfUnordered,
2014-05-01 18:44:42 +00:00
ir::Value* a,
ir::Value* b,
2014-05-01 18:14:27 +00:00
unsigned* newIpp)
{
2014-06-29 04:57:07 +00:00
if (ip + 3 > code->length()) {
2009-10-07 00:50:32 +00:00
return false;
}
avian::codegen::Compiler* c = frame->c;
2014-06-29 04:57:07 +00:00
unsigned instruction = code->body()[ip++];
2009-10-07 00:50:32 +00:00
uint32_t offset = codeReadInt16(t, code, ip);
uint32_t newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-05-01 18:44:42 +00:00
ir::Value* target = frame->machineIpValue(newIp);
2009-10-07 00:50:32 +00:00
switch (instruction) {
case ifeq:
case ifne:
case ifgt:
case ifge:
case iflt:
2009-10-07 00:50:32 +00:00
case ifle:
2014-07-11 15:50:18 +00:00
c->condJump(
toCompilerFloatJumpOp(t, instruction, lessIfUnordered), a, b, target);
break;
2009-10-07 00:50:32 +00:00
default:
2009-10-07 00:50:32 +00:00
ip -= 3;
return false;
}
*newIpp = newIp;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return true;
}
2014-05-01 18:44:42 +00:00
ir::Value* popLongAddress(Frame* frame)
{
return TargetBytesPerWord == 8
2014-06-01 20:22:14 +00:00
? frame->popLarge(ir::Type::i8())
2014-07-12 17:54:19 +00:00
: frame->c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
frame->popLarge(ir::Type::i8()),
ir::Type::iptr());
}
2014-07-11 15:47:57 +00:00
bool intrinsic(MyThread* t UNUSED, Frame* frame, GcMethod* target)
{
2014-06-29 04:57:07 +00:00
#define MATCH(name, constant) \
(name->length() == sizeof(constant) \
and ::strcmp(reinterpret_cast<char*>(name->body().begin()), constant) == 0)
GcByteArray* className = target->class_()->name();
if (UNLIKELY(MATCH(className, "java/lang/Math"))) {
avian::codegen::Compiler* c = frame->c;
2014-05-29 04:17:25 +00:00
if (MATCH(target->name(), "sqrt") and MATCH(target->spec(), "(D)D")) {
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::f8(),
c->unaryOp(lir::FloatSquareRoot, frame->popLarge(ir::Type::f8())));
return true;
2014-05-29 04:17:25 +00:00
} else if (MATCH(target->name(), "abs")) {
if (MATCH(target->spec(), "(I)I")) {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->unaryOp(lir::Absolute, frame->pop(ir::Type::i4())));
return true;
2014-05-29 04:17:25 +00:00
} else if (MATCH(target->spec(), "(J)J")) {
2014-06-01 20:22:14 +00:00
frame->pushLarge(
ir::Type::i8(),
c->unaryOp(lir::Absolute, frame->popLarge(ir::Type::i8())));
return true;
2014-05-29 04:17:25 +00:00
} else if (MATCH(target->spec(), "(F)F")) {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->unaryOp(lir::FloatAbsolute, frame->pop(ir::Type::f4())));
return true;
}
}
} else if (UNLIKELY(MATCH(className, "sun/misc/Unsafe"))) {
avian::codegen::Compiler* c = frame->c;
2014-05-29 04:17:25 +00:00
if (MATCH(target->name(), "getByte") and MATCH(target->spec(), "(J)B")) {
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(address, ir::Type::i1()),
ir::Type::i4()));
return true;
2014-07-11 15:47:57 +00:00
} else if (MATCH(target->name(), "putByte")
and MATCH(target->spec(), "(JB)V")) {
2014-06-01 20:22:14 +00:00
ir::Value* value = frame->pop(ir::Type::i4());
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
c->store(value, c->memory(address, ir::Type::i1()));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "getShort")
and MATCH(target->spec(), "(J)S"))
or (MATCH(target->name(), "getChar")
and MATCH(target->spec(), "(J)C"))) {
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(address, ir::Type::i2()),
ir::Type::i4()));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "putShort")
and MATCH(target->spec(), "(JS)V"))
or (MATCH(target->name(), "putChar")
and MATCH(target->spec(), "(JC)V"))) {
2014-06-01 20:22:14 +00:00
ir::Value* value = frame->pop(ir::Type::i4());
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
c->store(value, c->memory(address, ir::Type::i2()));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "getInt")
and MATCH(target->spec(), "(J)I"))
or (MATCH(target->name(), "getFloat")
and MATCH(target->spec(), "(J)F"))) {
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
2014-05-29 04:17:25 +00:00
ir::Type type = MATCH(target->name(), "getInt") ? ir::Type::i4()
: ir::Type::f4();
2014-07-17 00:07:56 +00:00
frame->push(
type,
c->load(ir::ExtendMode::Signed, c->memory(address, type), type));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "putInt")
and MATCH(target->spec(), "(JI)V"))
or (MATCH(target->name(), "putFloat")
and MATCH(target->spec(), "(JF)V"))) {
2014-05-29 04:17:25 +00:00
ir::Type type = MATCH(target->name(), "putInt") ? ir::Type::i4()
: ir::Type::f4();
ir::Value* value = frame->pop(type);
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
c->store(value, c->memory(address, type));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "getLong")
and MATCH(target->spec(), "(J)J"))
or (MATCH(target->name(), "getDouble")
and MATCH(target->spec(), "(J)D"))) {
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
2014-05-29 04:17:25 +00:00
ir::Type type = MATCH(target->name(), "getLong") ? ir::Type::i8()
: ir::Type::f8();
2014-07-17 00:07:56 +00:00
frame->pushLarge(
type,
c->load(ir::ExtendMode::Signed, c->memory(address, type), type));
return true;
2014-07-11 15:47:57 +00:00
} else if ((MATCH(target->name(), "putLong")
and MATCH(target->spec(), "(JJ)V"))
or (MATCH(target->name(), "putDouble")
and MATCH(target->spec(), "(JD)V"))) {
2014-05-29 04:17:25 +00:00
ir::Type type = MATCH(target->name(), "putLong") ? ir::Type::i8()
: ir::Type::f8();
ir::Value* value = frame->popLarge(type);
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
c->store(value, c->memory(address, type));
return true;
2014-07-11 15:47:57 +00:00
} else if (MATCH(target->name(), "getAddress")
and MATCH(target->spec(), "(J)J")) {
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
frame->pushLarge(ir::Type::i8(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(address, ir::Type::iptr()),
ir::Type::i8()));
return true;
2014-07-11 15:47:57 +00:00
} else if (MATCH(target->name(), "putAddress")
and MATCH(target->spec(), "(JJ)V")) {
2014-06-01 20:22:14 +00:00
ir::Value* value = frame->popLarge(ir::Type::i8());
2014-05-01 18:44:42 +00:00
ir::Value* address = popLongAddress(frame);
2014-06-01 20:22:14 +00:00
frame->pop(ir::Type::object());
c->store(value, c->memory(address, ir::Type::iptr()));
return true;
}
}
return false;
}
2014-07-11 15:47:57 +00:00
unsigned targetFieldOffset(Context* context, GcField* field)
{
if (context->bootContext) {
return context->bootContext->resolver->fieldOffset(context->thread, field);
} else {
2014-06-29 04:57:07 +00:00
return field->offset();
}
}
class Stack {
public:
2014-07-11 15:50:18 +00:00
class MyResource : public Thread::AutoResource {
public:
2014-07-11 15:50:18 +00:00
MyResource(Stack* s) : AutoResource(s->thread), s(s)
{
}
2014-07-11 15:50:18 +00:00
virtual void release()
{
s->zone.dispose();
}
Stack* s;
};
2014-05-05 04:02:47 +00:00
Stack(MyThread* t) : thread(t), zone(t->m->heap, 0), resource(this)
2014-07-11 15:50:18 +00:00
{
}
2014-07-11 15:50:18 +00:00
~Stack()
{
zone.dispose();
}
2014-07-11 15:50:18 +00:00
void pushValue(uintptr_t v)
{
*static_cast<uintptr_t*>(push(BytesPerWord)) = v;
}
2014-07-11 15:50:18 +00:00
uintptr_t peekValue(unsigned offset)
{
return *static_cast<uintptr_t*>(peek((offset + 1) * BytesPerWord));
}
2014-07-11 15:50:18 +00:00
uintptr_t popValue()
{
uintptr_t v = peekValue(0);
pop(BytesPerWord);
return v;
}
2014-07-11 15:50:18 +00:00
void* push(unsigned size)
{
return zone.allocate(size);
}
2014-07-11 15:50:18 +00:00
void* peek(unsigned size)
{
return zone.peek(size);
}
2014-07-11 15:50:18 +00:00
void pop(unsigned size)
{
zone.pop(size);
}
MyThread* thread;
Zone zone;
MyResource resource;
};
class SwitchState {
public:
SwitchState(Compiler::State* state,
unsigned count,
unsigned defaultIp,
2014-05-01 18:44:42 +00:00
ir::Value* key,
avian::codegen::Promise* start,
int bottom,
2014-05-01 18:44:42 +00:00
int top)
: state(state),
count(count),
defaultIp(defaultIp),
key(key),
start(start),
bottom(bottom),
top(top),
index(0)
2014-07-11 15:50:18 +00:00
{
}
2014-07-11 15:50:18 +00:00
Frame* frame()
{
return reinterpret_cast<Frame*>(reinterpret_cast<uint8_t*>(this)
- pad(count * 4) - pad(sizeof(Frame)));
}
2014-07-11 15:50:18 +00:00
uint32_t* ipTable()
{
return reinterpret_cast<uint32_t*>(reinterpret_cast<uint8_t*>(this)
- pad(count * 4));
}
Compiler::State* state;
unsigned count;
unsigned defaultIp;
2014-05-01 18:44:42 +00:00
ir::Value* key;
avian::codegen::Promise* start;
int bottom;
int top;
unsigned index;
};
lir::TernaryOperation toCompilerBinaryOp(MyThread* t, unsigned instruction)
{
switch (instruction) {
case iadd:
case ladd:
return lir::Add;
case ior:
case lor:
return lir::Or;
case ishl:
case lshl:
return lir::ShiftLeft;
case ishr:
case lshr:
return lir::ShiftRight;
case iushr:
case lushr:
return lir::UnsignedShiftRight;
case fadd:
case dadd:
return lir::FloatAdd;
case fsub:
case dsub:
return lir::FloatSubtract;
case fmul:
case dmul:
return lir::FloatMultiply;
case fdiv:
case ddiv:
return lir::FloatDivide;
case frem:
case vm::drem:
return lir::FloatRemainder;
case iand:
case land:
return lir::And;
case isub:
case lsub:
return lir::Subtract;
case ixor:
case lxor:
return lir::Xor;
case imul:
case lmul:
return lir::Multiply;
default:
abort(t);
}
}
uintptr_t aioobThunk(MyThread* t);
uintptr_t stackOverflowThunk(MyThread* t);
void checkField(Thread* t, GcField* field, bool shouldBeStatic)
{
if (((field->flags() & ACC_STATIC) == 0) == shouldBeStatic) {
throwNew(t,
GcIncompatibleClassChangeError::Type,
"expected %s.%s to be %s",
field->class_()->name()->body().begin(),
field->name()->body().begin(),
shouldBeStatic ? "static" : "non-static");
}
}
2014-07-11 15:50:18 +00:00
void compile(MyThread* t,
Frame* initialFrame,
unsigned initialIp,
int exceptionHandlerStart = -1)
{
2014-07-11 15:50:18 +00:00
enum { Return, Unbranch, Unsubroutine, Untable0, Untable1, Unswitch };
Frame* frame = initialFrame;
avian::codegen::Compiler* c = frame->c;
Context* context = frame->context;
2014-06-28 04:00:05 +00:00
unsigned stackSize = context->method->code()->maxStack();
Stack stack(t);
unsigned ip = initialIp;
unsigned newIp;
stack.pushValue(Return);
2014-07-11 15:50:18 +00:00
start:
ir::Type* stackMap
= static_cast<ir::Type*>(stack.push(stackSize * sizeof(ir::Type)));
frame = new (stack.push(sizeof(Frame))) Frame(frame, stackMap);
2007-09-25 23:53:11 +00:00
2014-07-11 15:50:18 +00:00
loop:
GcCode* code = context->method->code();
2007-12-09 22:45:43 +00:00
PROTECT(t, code);
2014-05-29 04:17:25 +00:00
2014-06-29 04:57:07 +00:00
while (ip < code->length()) {
if (context->visitTable[frame->duplicatedIp(ip)]++) {
2007-12-09 22:45:43 +00:00
// we've already visited this part of the code
2008-04-20 05:23:08 +00:00
frame->visitLogicalIp(ip);
goto next;
2007-09-30 04:07:22 +00:00
}
2007-12-09 22:45:43 +00:00
frame->startLogicalIp(ip);
if (exceptionHandlerStart >= 0) {
2008-09-25 00:48:32 +00:00
c->initLocalsFromLogicalIp(exceptionHandlerStart);
exceptionHandlerStart = -1;
2008-04-19 07:03:59 +00:00
frame->pushObject();
2014-07-17 00:07:56 +00:00
c->nativeCall(
c->constant(getThunk(t, gcIfNecessaryThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister()));
2008-04-09 19:08:13 +00:00
}
if (DebugInstructions) {
unsigned startingIp = ip;
fprintf(stderr, " stack: [");
for (size_t i = frame->localSize(); i < frame->sp; i++) {
2014-05-05 16:49:50 +00:00
ir::Type ty = frame->get(i);
2014-06-01 20:22:14 +00:00
if (ty == ir::Type::i4()) {
fprintf(stderr, "I");
2014-06-01 20:22:14 +00:00
} else if (ty == ir::Type::i8()) {
fprintf(stderr, "L");
2014-06-01 20:22:14 +00:00
} else if (ty == ir::Type::f4()) {
2014-05-05 16:49:50 +00:00
fprintf(stderr, "F");
2014-06-01 20:22:14 +00:00
} else if (ty == ir::Type::f8()) {
2014-05-05 16:49:50 +00:00
fprintf(stderr, "D");
2014-06-01 20:22:14 +00:00
} else if (ty == ir::Type::object()) {
fprintf(stderr, "O");
2014-05-05 16:49:50 +00:00
} else {
fprintf(stderr, "?");
}
}
fprintf(stderr, "]\n");
fprintf(stderr, "% 5d: ", startingIp);
2014-06-29 04:57:07 +00:00
avian::jvm::debug::printInstruction(code->body().begin(), startingIp);
fprintf(stderr, "\n");
}
2014-06-29 04:57:07 +00:00
unsigned instruction = code->body()[ip++];
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
switch (instruction) {
case aaload:
case baload:
case caload:
case daload:
case faload:
case iaload:
case laload:
case saload: {
2014-06-01 20:22:14 +00:00
ir::Value* index = frame->pop(ir::Type::i4());
ir::Value* array = frame->pop(ir::Type::object());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
if (CheckArrayBounds) {
c->checkBounds(array, TargetArrayLength, index, aioobThunk(t));
}
2007-09-25 23:53:11 +00:00
switch (instruction) {
case aaload:
frame->push(
2014-06-01 20:22:14 +00:00
ir::Type::object(),
c->load(
2014-07-12 17:54:19 +00:00
ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::object(), TargetArrayBody, index),
ir::Type::object()));
break;
case faload:
2014-06-01 20:22:14 +00:00
frame->push(
ir::Type::f4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::f4(), TargetArrayBody, index),
ir::Type::f4()));
break;
2009-11-30 15:08:45 +00:00
case iaload:
2014-06-01 20:22:14 +00:00
frame->push(
ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::i4(), TargetArrayBody, index),
ir::Type::i4()));
break;
case baload:
2014-06-01 20:22:14 +00:00
frame->push(
ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::i1(), TargetArrayBody, index),
ir::Type::i4()));
break;
case caload:
2014-06-01 20:22:14 +00:00
frame->push(
ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Unsigned,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::i2(), TargetArrayBody, index),
ir::Type::i4()));
break;
case daload:
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::f8(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::f8(), TargetArrayBody, index),
ir::Type::f8()));
break;
case laload:
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::i8(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::i8(), TargetArrayBody, index),
ir::Type::i8()));
break;
case saload:
2014-06-01 20:22:14 +00:00
frame->push(
ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(array, ir::Type::i2(), TargetArrayBody, index),
ir::Type::i4()));
break;
2007-12-09 22:45:43 +00:00
}
} break;
2007-12-09 22:45:43 +00:00
case aastore:
case bastore:
case castore:
case dastore:
case fastore:
case iastore:
case lastore:
case sastore: {
2014-05-01 18:44:42 +00:00
ir::Value* value;
if (instruction == lastore) {
2014-06-01 20:22:14 +00:00
value = frame->popLarge(ir::Type::i8());
} else if (instruction == dastore) {
2014-06-01 20:22:14 +00:00
value = frame->popLarge(ir::Type::f8());
2007-12-09 22:45:43 +00:00
} else if (instruction == aastore) {
2014-06-01 20:22:14 +00:00
value = frame->pop(ir::Type::object());
} else if (instruction == fastore) {
2014-06-01 20:22:14 +00:00
value = frame->pop(ir::Type::f4());
2007-12-09 22:45:43 +00:00
} else {
2014-06-01 20:22:14 +00:00
value = frame->pop(ir::Type::i4());
2007-12-09 22:45:43 +00:00
}
2007-09-30 02:48:27 +00:00
2014-06-01 20:22:14 +00:00
ir::Value* index = frame->pop(ir::Type::i4());
ir::Value* array = frame->pop(ir::Type::object());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
if (CheckArrayBounds) {
c->checkBounds(array, TargetArrayLength, index, aioobThunk(t));
}
switch (instruction) {
case aastore: {
c->nativeCall(
c->constant(getThunk(t, setMaybeNullThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(),
array,
c->binaryOp(lir::Add,
ir::Type::i4(),
c->constant(TargetArrayBody, ir::Type::i4()),
c->binaryOp(lir::ShiftLeft,
ir::Type::i4(),
c->constant(log(TargetBytesPerWord),
ir::Type::i4()),
index)),
value));
} break;
case fastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::f4(), TargetArrayBody, index));
break;
case iastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::i4(), TargetArrayBody, index));
break;
case bastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::i1(), TargetArrayBody, index));
break;
case castore:
case sastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::i2(), TargetArrayBody, index));
break;
case dastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::f8(), TargetArrayBody, index));
break;
case lastore:
2014-06-01 20:22:14 +00:00
c->store(value,
c->memory(array, ir::Type::i8(), TargetArrayBody, index));
break;
2007-12-09 22:45:43 +00:00
}
} break;
2007-09-30 15:52:21 +00:00
2007-12-09 22:45:43 +00:00
case aconst_null:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::object(), c->constant(0, ir::Type::object()));
2007-12-09 22:45:43 +00:00
break;
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
case aload:
2014-06-29 04:57:07 +00:00
frame->load(ir::Type::object(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case aload_0:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::object(), 0);
2007-12-09 22:45:43 +00:00
break;
2007-10-08 23:13:55 +00:00
2007-12-09 22:45:43 +00:00
case aload_1:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::object(), 1);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case aload_2:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::object(), 2);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case aload_3:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::object(), 3);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case anewarray: {
uint16_t index = codeReadInt16(t, code, ip);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClassInPool(t, context->method, index - 1, false);
2014-06-01 20:22:14 +00:00
ir::Value* length = frame->pop(ir::Type::i4());
2007-10-08 23:13:55 +00:00
object argument;
Thunk thunk;
if (LIKELY(class_)) {
argument = class_;
thunk = makeBlankObjectArrayThunk;
} else {
argument = makePair(t, context->method, reference);
thunk = makeBlankObjectArrayFromReferenceThunk;
}
frame->push(
ir::Type::object(),
c->nativeCall(
c->constant(getThunk(t, thunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::object(),
args(c->threadRegister(), frame->append(argument), length)));
2007-12-09 22:45:43 +00:00
} break;
case areturn: {
handleExit(t, frame);
2014-06-01 20:22:14 +00:00
c->return_(frame->pop(ir::Type::object()));
2014-07-11 15:50:18 +00:00
}
goto next;
case arraylength: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(frame->pop(ir::Type::object()),
ir::Type::iptr(),
TargetArrayLength),
2014-06-01 20:22:14 +00:00
ir::Type::i4()));
} break;
2007-10-04 03:19:39 +00:00
2007-12-09 22:45:43 +00:00
case astore:
2014-06-29 04:57:07 +00:00
frame->store(ir::Type::object(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case astore_0:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::object(), 0);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case astore_1:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::object(), 1);
2007-12-09 22:45:43 +00:00
break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case astore_2:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::object(), 2);
2007-12-09 22:45:43 +00:00
break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case astore_3:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::object(), 3);
2007-12-09 22:45:43 +00:00
break;
2007-10-10 21:34:04 +00:00
case athrow: {
2014-06-01 20:22:14 +00:00
ir::Value* target = frame->pop(ir::Type::object());
c->nativeCall(c->constant(getThunk(t, throw_Thunk), ir::Type::iptr()),
Compiler::NoReturn,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), target));
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
c->nullaryOp(lir::Trap);
2014-07-11 15:50:18 +00:00
}
goto next;
2007-12-09 22:45:43 +00:00
case bipush:
2014-07-11 15:47:57 +00:00
frame->push(
ir::Type::i4(),
c->constant(static_cast<int8_t>(code->body()[ip++]), ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case checkcast: {
uint16_t index = codeReadInt16(t, code, ip);
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClassInPool(t, context->method, index - 1, false);
object argument;
Thunk thunk;
if (LIKELY(class_)) {
argument = class_;
thunk = checkCastThunk;
} else {
argument = makePair(t, context->method, reference);
thunk = checkCastFromReferenceThunk;
}
2014-05-01 18:44:42 +00:00
ir::Value* instance = c->peek(1, 0);
c->nativeCall(
c->constant(getThunk(t, thunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), frame->append(argument), instance));
2007-12-09 22:45:43 +00:00
} break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case d2f: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->f2f(ir::Type::f4(), frame->popLarge(ir::Type::f8())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case d2i: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->f2i(ir::Type::i4(), frame->popLarge(ir::Type::f8())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case d2l: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
c->f2i(ir::Type::i8(), frame->popLarge(ir::Type::f8())));
2007-12-09 22:45:43 +00:00
} break;
2007-10-10 21:34:04 +00:00
case dadd:
case dsub:
case dmul:
case ddiv:
case vm::drem: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::f8());
ir::Value* b = frame->popLarge(ir::Type::f8());
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::f8(),
c->binaryOp(
toCompilerBinaryOp(t, instruction), ir::Type::f8(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case dcmpg: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::f8());
ir::Value* b = frame->popLarge(ir::Type::f8());
if (floatBranch(t, frame, code, ip, false, a, b, &newIp)) {
goto branch;
} else {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->nativeCall(c->constant(getThunk(t, compareDoublesGThunk),
ir::Type::iptr()),
0,
0,
ir::Type::i4(),
args(nullptr, a, nullptr, b)));
}
2007-12-09 22:45:43 +00:00
} break;
2007-10-10 21:34:04 +00:00
2007-12-09 22:45:43 +00:00
case dcmpl: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::f8());
ir::Value* b = frame->popLarge(ir::Type::f8());
if (floatBranch(t, frame, code, ip, true, a, b, &newIp)) {
goto branch;
} else {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->nativeCall(c->constant(getThunk(t, compareDoublesLThunk),
ir::Type::iptr()),
0,
0,
ir::Type::i4(),
args(nullptr, a, nullptr, b)));
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case dconst_0:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
c->constant(doubleToBits(0.0), ir::Type::f8()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case dconst_1:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
c->constant(doubleToBits(1.0), ir::Type::f8()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case dneg: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(
ir::Type::f8(),
c->unaryOp(lir::FloatNegate, frame->popLarge(ir::Type::f8())));
2007-12-09 22:45:43 +00:00
} break;
2014-06-29 04:57:07 +00:00
case vm::dup:
2007-12-09 22:45:43 +00:00
frame->dup();
break;
2007-12-09 22:45:43 +00:00
case dup_x1:
frame->dupX1();
break;
2007-12-09 22:45:43 +00:00
case dup_x2:
frame->dupX2();
break;
2014-06-29 04:57:07 +00:00
case vm::dup2:
2007-12-09 22:45:43 +00:00
frame->dup2();
break;
2007-12-09 22:45:43 +00:00
case dup2_x1:
frame->dup2X1();
break;
2007-12-09 22:45:43 +00:00
case dup2_x2:
frame->dup2X2();
break;
2007-10-09 17:15:40 +00:00
2007-12-09 22:45:43 +00:00
case f2d: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
c->f2f(ir::Type::f8(), frame->pop(ir::Type::f4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case f2i: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->f2i(ir::Type::i4(), frame->pop(ir::Type::f4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case f2l: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
c->f2i(ir::Type::i8(), frame->pop(ir::Type::f4())));
2007-12-09 22:45:43 +00:00
} break;
case fadd:
case fsub:
case fmul:
case fdiv:
case frem: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::f4());
ir::Value* b = frame->pop(ir::Type::f4());
frame->push(
2014-06-01 20:22:14 +00:00
ir::Type::f4(),
c->binaryOp(
toCompilerBinaryOp(t, instruction), ir::Type::f4(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case fcmpg: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::f4());
ir::Value* b = frame->pop(ir::Type::f4());
if (floatBranch(t, frame, code, ip, false, a, b, &newIp)) {
goto branch;
} else {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->nativeCall(c->constant(getThunk(t, compareFloatsGThunk),
ir::Type::iptr()),
0,
0,
ir::Type::i4(),
args(a, b)));
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case fcmpl: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::f4());
ir::Value* b = frame->pop(ir::Type::f4());
if (floatBranch(t, frame, code, ip, true, a, b, &newIp)) {
goto branch;
} else {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->nativeCall(c->constant(getThunk(t, compareFloatsLThunk),
ir::Type::iptr()),
0,
0,
ir::Type::i4(),
args(a, b)));
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case fconst_0:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->constant(floatToBits(0.0), ir::Type::f4()));
2007-12-09 22:45:43 +00:00
break;
2014-05-29 04:17:25 +00:00
2007-12-09 22:45:43 +00:00
case fconst_1:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->constant(floatToBits(1.0), ir::Type::f4()));
2007-12-09 22:45:43 +00:00
break;
2014-05-29 04:17:25 +00:00
2007-12-09 22:45:43 +00:00
case fconst_2:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->constant(floatToBits(2.0), ir::Type::f4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case fneg: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->unaryOp(lir::FloatNegate, frame->pop(ir::Type::f4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case getfield:
case getstatic: {
uint16_t index = codeReadInt16(t, code, ip);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, context->method, index - 1, false);
if (LIKELY(field)) {
2014-07-11 15:47:57 +00:00
if ((field->flags() & ACC_VOLATILE) and TargetBytesPerWord == 4
and (field->code() == DoubleField or field->code() == LongField)) {
PROTECT(t, field);
c->nativeCall(c->constant(getThunk(t, acquireMonitorForObjectThunk),
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), frame->append(field)));
}
2014-05-01 18:44:42 +00:00
ir::Value* table;
if (instruction == getstatic) {
checkField(t, field, true);
PROTECT(t, field);
2014-06-29 04:57:07 +00:00
if (classNeedsInit(t, field->class_())) {
c->nativeCall(
2014-07-11 15:47:57 +00:00
c->constant(getThunk(t, tryInitClassThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(field->class_())));
}
2014-06-29 04:57:07 +00:00
table = frame->append(field->class_()->staticTable());
} else {
checkField(t, field, false);
2014-06-01 20:22:14 +00:00
table = frame->pop(ir::Type::object());
if (inTryBlock(t, code, ip - 3)) {
c->saveLocals();
frame->trace(0, 0);
}
}
2014-06-29 04:57:07 +00:00
switch (field->code()) {
case ByteField:
case BooleanField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::i1(),
targetFieldOffset(context, field)),
ir::Type::i4()));
break;
case CharField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Unsigned,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::i2(),
targetFieldOffset(context, field)),
ir::Type::i4()));
break;
case ShortField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::i2(),
targetFieldOffset(context, field)),
ir::Type::i4()));
break;
case FloatField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::f4(),
targetFieldOffset(context, field)),
ir::Type::f4()));
break;
case IntField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::i4(),
targetFieldOffset(context, field)),
ir::Type::i4()));
break;
case DoubleField:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::f8(),
targetFieldOffset(context, field)),
ir::Type::f8()));
break;
case LongField:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
c->memory(table,
ir::Type::i8(),
targetFieldOffset(context, field)),
ir::Type::i8()));
break;
case ObjectField:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::object(),
2014-07-12 17:54:19 +00:00
c->load(ir::ExtendMode::Signed,
c->memory(table,
2014-06-01 20:22:14 +00:00
ir::Type::object(),
targetFieldOffset(context, field)),
2014-06-01 20:22:14 +00:00
ir::Type::object()));
break;
default:
abort(t);
}
2009-03-03 03:18:15 +00:00
2014-06-29 04:57:07 +00:00
if (field->flags() & ACC_VOLATILE) {
2014-07-11 15:47:57 +00:00
if (TargetBytesPerWord == 4 and (field->code() == DoubleField
or field->code() == LongField)) {
c->nativeCall(c->constant(getThunk(t, releaseMonitorForObjectThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), frame->append(field)));
} else {
c->nullaryOp(lir::LoadBarrier);
}
}
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, ref);
2014-07-11 15:47:57 +00:00
int fieldCode = vm::fieldCode(t, ref->spec()->body()[0]);
GcPair* pair = makePair(t, context->method, reference);
ir::Type rType = operandTypeForFieldCode(t, fieldCode);
2014-05-01 18:44:42 +00:00
ir::Value* result;
if (instruction == getstatic) {
result = c->nativeCall(
c->constant(getThunk(t, getStaticFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(pair)));
} else {
2014-06-01 20:22:14 +00:00
ir::Value* instance = frame->pop(ir::Type::object());
result = c->nativeCall(
c->constant(getThunk(t, getFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(pair), instance));
}
frame->pushReturnValue(fieldCode, result);
2009-03-03 03:18:15 +00:00
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case goto_: {
uint32_t offset = codeReadInt16(t, code, ip);
uint32_t newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
c->jmp(frame->machineIpValue(newIp));
2007-12-09 22:45:43 +00:00
ip = newIp;
} break;
2007-12-09 22:45:43 +00:00
case goto_w: {
uint32_t offset = codeReadInt32(t, code, ip);
uint32_t newIp = (ip - 5) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
c->jmp(frame->machineIpValue(newIp));
2007-12-09 22:45:43 +00:00
ip = newIp;
} break;
2007-12-09 22:45:43 +00:00
case i2b: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->truncateThenExtend(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
ir::Type::i1(),
frame->pop(ir::Type::i4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case i2c: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->truncateThenExtend(ir::ExtendMode::Unsigned,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
ir::Type::i2(),
frame->pop(ir::Type::i4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case i2d: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
c->i2f(ir::Type::f8(), frame->pop(ir::Type::i4())));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case i2f: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->i2f(ir::Type::f4(), frame->pop(ir::Type::i4())));
2007-12-09 22:45:43 +00:00
} break;
case i2l:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
2014-07-12 17:54:19 +00:00
c->truncateThenExtend(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
ir::Type::i8(),
ir::Type::i4(),
frame->pop(ir::Type::i4())));
break;
2007-10-04 03:19:39 +00:00
2007-12-09 22:45:43 +00:00
case i2s: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
2014-07-12 17:54:19 +00:00
c->truncateThenExtend(ir::ExtendMode::Signed,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
ir::Type::i2(),
frame->pop(ir::Type::i4())));
2007-12-09 22:45:43 +00:00
} break;
2014-05-29 04:17:25 +00:00
case iadd:
case iand:
case ior:
case ishl:
case ishr:
case iushr:
case isub:
case ixor:
case imul: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::i4());
ir::Value* b = frame->pop(ir::Type::i4());
frame->push(
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
c->binaryOp(
toCompilerBinaryOp(t, instruction), ir::Type::i4(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 00:41:54 +00:00
2007-12-09 22:45:43 +00:00
case iconst_m1:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(-1, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-10-04 00:41:54 +00:00
2007-12-09 22:45:43 +00:00
case iconst_0:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(0, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-10-04 00:41:54 +00:00
2007-12-09 22:45:43 +00:00
case iconst_1:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(1, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case iconst_2:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(2, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case iconst_3:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(3, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
case iconst_4:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(4, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
case iconst_5:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(), c->constant(5, ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case idiv: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::i4());
ir::Value* b = frame->pop(ir::Type::i4());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->binaryOp(lir::Divide, ir::Type::i4(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case if_acmpeq:
case if_acmpne: {
uint32_t offset = codeReadInt16(t, code, ip);
newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
2014-05-01 18:44:42 +00:00
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::object());
ir::Value* b = frame->pop(ir::Type::object());
ir::Value* target = frame->machineIpValue(newIp);
c->condJump(toCompilerJumpOp(t, instruction), a, b, target);
2014-07-11 15:50:18 +00:00
}
goto branch;
2007-12-09 22:45:43 +00:00
case if_icmpeq:
case if_icmpne:
case if_icmpgt:
case if_icmpge:
case if_icmplt:
case if_icmple: {
uint32_t offset = codeReadInt16(t, code, ip);
newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
2014-05-01 18:44:42 +00:00
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::i4());
ir::Value* b = frame->pop(ir::Type::i4());
ir::Value* target = frame->machineIpValue(newIp);
c->condJump(toCompilerJumpOp(t, instruction), a, b, target);
2014-07-11 15:50:18 +00:00
}
goto branch;
2007-10-03 00:22:48 +00:00
2007-12-09 22:45:43 +00:00
case ifeq:
case ifne:
case ifgt:
case ifge:
case iflt:
case ifle: {
uint32_t offset = codeReadInt16(t, code, ip);
newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2007-10-03 00:22:48 +00:00
ir::Value* target = frame->machineIpValue(newIp);
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
2014-06-01 20:22:14 +00:00
ir::Value* a = c->constant(0, ir::Type::i4());
ir::Value* b = frame->pop(ir::Type::i4());
2009-10-07 00:50:32 +00:00
c->condJump(toCompilerJumpOp(t, instruction), a, b, target);
2014-07-11 15:50:18 +00:00
}
goto branch;
2007-12-09 22:45:43 +00:00
case ifnull:
case ifnonnull: {
uint32_t offset = codeReadInt16(t, code, ip);
newIp = (ip - 3) + offset;
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2014-07-11 15:50:18 +00:00
if (newIp <= ip) {
compileSafePoint(t, c, frame);
}
2014-06-01 20:22:14 +00:00
ir::Value* a = c->constant(0, ir::Type::object());
ir::Value* b = frame->pop(ir::Type::object());
ir::Value* target = frame->machineIpValue(newIp);
2007-09-30 02:48:27 +00:00
c->condJump(toCompilerJumpOp(t, instruction), a, b, target);
2014-07-11 15:50:18 +00:00
}
goto branch;
2007-09-29 21:08:29 +00:00
2007-12-09 22:45:43 +00:00
case iinc: {
2014-06-29 04:57:07 +00:00
uint8_t index = code->body()[ip++];
int8_t count = code->body()[ip++];
2007-09-29 21:08:29 +00:00
storeLocal(context,
1,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
c->binaryOp(lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
c->constant(count, ir::Type::i4()),
loadLocal(context, 1, ir::Type::i4(), index)),
index);
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case iload:
2014-06-29 04:57:07 +00:00
frame->load(ir::Type::i4(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case fload:
2014-06-29 04:57:07 +00:00
frame->load(ir::Type::f4(), code->body()[ip++]);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case iload_0:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::i4(), 0);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case fload_0:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::f4(), 0);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case iload_1:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::i4(), 1);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case fload_1:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::f4(), 1);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case iload_2:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::i4(), 2);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case fload_2:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::f4(), 2);
2014-05-02 15:01:57 +00:00
break;
2007-10-03 00:22:48 +00:00
2007-12-09 22:45:43 +00:00
case iload_3:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::i4(), 3);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case fload_3:
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::f4(), 3);
2014-05-02 15:01:57 +00:00
break;
2007-10-03 00:22:48 +00:00
case ineg: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->unaryOp(lir::Negate, frame->pop(ir::Type::i4())));
} break;
2007-12-09 22:45:43 +00:00
case instanceof: {
uint16_t index = codeReadInt16(t, code, ip);
2007-09-30 04:07:22 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClassInPool(t, context->method, index - 1, false);
2014-06-01 20:22:14 +00:00
ir::Value* instance = frame->pop(ir::Type::object());
object argument;
Thunk thunk;
if (LIKELY(class_)) {
argument = class_;
thunk = instanceOf64Thunk;
} else {
argument = makePair(t, context->method, reference);
thunk = instanceOfFromReferenceThunk;
}
2007-09-30 04:07:22 +00:00
2014-07-17 00:07:56 +00:00
frame->push(
ir::Type::i4(),
c->nativeCall(
c->constant(getThunk(t, thunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::i4(),
args(c->threadRegister(), frame->append(argument), instance)));
2007-12-09 22:45:43 +00:00
} break;
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
case invokeinterface: {
context->leaf = false;
2007-12-09 22:45:43 +00:00
uint16_t index = codeReadInt16(t, code, ip);
ip += 2;
2007-09-30 02:48:27 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
2007-09-30 02:48:27 +00:00
PROTECT(t, reference);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, context->method, index - 1, false);
2007-09-30 02:48:27 +00:00
object argument;
Thunk thunk;
unsigned parameterFootprint;
int returnCode;
bool tailCall;
if (LIKELY(target)) {
checkMethod(t, target, false);
argument = target;
thunk = findInterfaceMethodFromInstanceThunk;
2014-05-29 04:17:25 +00:00
parameterFootprint = target->parameterFootprint();
returnCode = target->returnCode();
tailCall = isTailCall(t, code, ip, context->method, target);
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, ref);
argument = makePair(t, context->method, reference);
thunk = findInterfaceMethodFromInstanceAndReferenceThunk;
2014-07-11 15:47:57 +00:00
parameterFootprint = methodReferenceParameterFootprint(t, ref, false);
2014-06-29 04:57:07 +00:00
returnCode = methodReferenceReturnCode(t, ref);
2014-07-11 15:47:57 +00:00
tailCall = isReferenceTailCall(t, code, ip, context->method, ref);
}
unsigned rSize = resultSize(t, returnCode);
2014-06-01 20:22:14 +00:00
ir::Value* result = c->stackCall(
c->nativeCall(c->constant(getThunk(t, thunk), ir::Type::iptr()),
2014-07-17 00:07:56 +00:00
0,
frame->trace(0, 0),
ir::Type::iptr(),
args(c->threadRegister(),
frame->append(argument),
c->peek(1, parameterFootprint - 1))),
2014-06-01 20:22:14 +00:00
tailCall ? Compiler::TailJump : 0,
frame->trace(0, 0),
operandTypeForFieldCode(t, returnCode),
frame->peekMethodArguments(parameterFootprint));
frame->popFootprint(parameterFootprint);
if (rSize) {
frame->pushReturnValue(returnCode, result);
2008-02-11 17:21:41 +00:00
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case invokespecial: {
context->leaf = false;
2007-12-09 22:45:43 +00:00
uint16_t index = codeReadInt16(t, code, ip);
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, context->method, index - 1, false);
if (LIKELY(target)) {
GcClass* class_ = context->method->class_();
if (isSpecialMethod(t, target, class_)) {
target = findVirtualMethod(t, target, class_->super());
}
checkMethod(t, target, false);
bool tailCall = isTailCall(t, code, ip, context->method, target);
if (UNLIKELY(methodAbstract(t, target))) {
2014-07-11 15:50:18 +00:00
compileDirectAbstractInvoke(
t, frame, getMethodAddressThunk, target, tailCall);
} else {
compileDirectInvoke(t, frame, target, tailCall);
}
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, ref);
2014-07-11 15:47:57 +00:00
compileDirectReferenceInvoke(
t,
frame,
findSpecialMethodFromReferenceThunk,
ref,
false,
isReferenceTailCall(t, code, ip, context->method, ref));
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case invokestatic: {
context->leaf = false;
2007-12-09 22:45:43 +00:00
uint16_t index = codeReadInt16(t, code, ip);
2007-09-30 02:48:27 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
2007-09-29 21:08:29 +00:00
PROTECT(t, reference);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, context->method, index - 1, false);
if (LIKELY(target)) {
checkMethod(t, target, true);
if (not intrinsic(t, frame, target)) {
bool tailCall = isTailCall(t, code, ip, context->method, target);
compileDirectInvoke(t, frame, target, tailCall);
}
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, ref);
2014-07-11 15:47:57 +00:00
compileDirectReferenceInvoke(
t,
frame,
findStaticMethodFromReferenceThunk,
ref,
true,
isReferenceTailCall(t, code, ip, context->method, ref));
}
2007-12-09 22:45:43 +00:00
} break;
2007-09-29 21:08:29 +00:00
2007-12-09 22:45:43 +00:00
case invokevirtual: {
context->leaf = false;
2007-12-09 22:45:43 +00:00
uint16_t index = codeReadInt16(t, code, ip);
2007-09-29 21:08:29 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
2007-09-29 21:08:29 +00:00
PROTECT(t, reference);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveMethod(t, context->method, index - 1, false);
if (LIKELY(target)) {
checkMethod(t, target, false);
2014-05-29 04:17:25 +00:00
if (not intrinsic(t, frame, target)) {
bool tailCall = isTailCall(t, code, ip, context->method, target);
2007-09-29 21:08:29 +00:00
if (LIKELY(methodVirtual(t, target))) {
2014-05-29 04:17:25 +00:00
unsigned parameterFootprint = target->parameterFootprint();
2007-09-29 21:08:29 +00:00
unsigned offset = TargetClassVtable
2014-07-11 15:47:57 +00:00
+ (target->offset() * TargetBytesPerWord);
2014-05-01 18:44:42 +00:00
ir::Value* instance = c->peek(1, parameterFootprint - 1);
frame->stackCall(
2014-06-01 20:22:14 +00:00
c->memory(c->binaryOp(
lir::And,
ir::Type::iptr(),
c->constant(TargetPointerMask, ir::Type::iptr()),
c->memory(instance, ir::Type::object())),
ir::Type::object(),
offset),
2014-05-01 19:56:39 +00:00
target,
tailCall ? Compiler::TailJump : 0,
2014-05-01 19:56:39 +00:00
frame->trace(0, 0));
} else {
// OpenJDK generates invokevirtual calls to private methods
// (e.g. readObject and writeObject for serialization), so
// we must handle such cases here.
compileDirectInvoke(t, frame, target, tailCall);
}
}
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, reference);
2014-06-29 04:57:07 +00:00
PROTECT(t, ref);
GcPair* pair = makePair(t, context->method, reference);
compileReferenceInvoke(
frame,
c->nativeCall(
c->constant(getThunk(t, findVirtualMethodFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
args(c->threadRegister(),
2014-07-17 00:07:56 +00:00
frame->append(pair),
c->peek(1,
methodReferenceParameterFootprint(t, ref, false)
- 1))),
2014-06-29 04:57:07 +00:00
ref,
false,
2014-06-29 04:57:07 +00:00
isReferenceTailCall(t, code, ip, context->method, ref));
2008-02-11 17:21:41 +00:00
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case irem: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::i4());
ir::Value* b = frame->pop(ir::Type::i4());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->binaryOp(lir::Remainder, ir::Type::i4(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2014-05-01 02:01:14 +00:00
case ireturn: {
handleExit(t, frame);
2014-06-01 20:22:14 +00:00
c->return_(frame->pop(ir::Type::i4()));
2014-05-01 02:01:14 +00:00
}
goto next;
case freturn: {
handleExit(t, frame);
2014-06-01 20:22:14 +00:00
c->return_(frame->pop(ir::Type::f4()));
2014-07-11 15:50:18 +00:00
}
goto next;
2007-12-09 22:45:43 +00:00
case istore:
2014-06-29 04:57:07 +00:00
frame->store(ir::Type::i4(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case fstore:
2014-06-29 04:57:07 +00:00
frame->store(ir::Type::f4(), code->body()[ip++]);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case istore_0:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::i4(), 0);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case fstore_0:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::f4(), 0);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case istore_1:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::i4(), 1);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case fstore_1:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::f4(), 1);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case istore_2:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::i4(), 2);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case fstore_2:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::f4(), 2);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case istore_3:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::i4(), 3);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case fstore_3:
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::f4(), 3);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case jsr:
case jsr_w: {
uint32_t thisIp;
if (instruction == jsr) {
uint32_t offset = codeReadInt16(t, code, ip);
thisIp = ip - 3;
newIp = thisIp + offset;
} else {
uint32_t offset = codeReadInt32(t, code, ip);
thisIp = ip - 5;
newIp = thisIp + offset;
}
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
frame->startSubroutine(newIp, ip);
c->jmp(frame->machineIpValue(newIp));
ip = newIp;
} break;
2008-03-21 00:37:58 +00:00
case l2d: {
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::f8(),
c->i2f(ir::Type::f8(), frame->popLarge(ir::Type::i8())));
2008-03-21 00:37:58 +00:00
} break;
case l2f: {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::f4(),
c->i2f(ir::Type::f4(), frame->popLarge(ir::Type::i8())));
2008-03-21 00:37:58 +00:00
} break;
case l2i:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->truncate(ir::Type::i4(), frame->popLarge(ir::Type::i8())));
break;
case ladd:
case land:
case lor:
case lsub:
case lxor:
case lmul: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::i8());
ir::Value* b = frame->popLarge(ir::Type::i8());
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::i8(),
c->binaryOp(
toCompilerBinaryOp(t, instruction), ir::Type::i8(), a, b));
} break;
2007-12-09 22:45:43 +00:00
case lcmp: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::i8());
ir::Value* b = frame->popLarge(ir::Type::i8());
if (integerBranch(t, frame, code, ip, a, b, &newIp)) {
goto branch;
} else {
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->nativeCall(c->constant(getThunk(t, compareLongsThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
0,
ir::Type::i4(),
args(nullptr, a, nullptr, b)));
2009-10-07 00:50:32 +00:00
}
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case lconst_0:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(), c->constant(0, ir::Type::i8()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case lconst_1:
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(), c->constant(1, ir::Type::i8()));
2007-12-09 22:45:43 +00:00
break;
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
case ldc:
case ldc_w: {
uint16_t index;
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
if (instruction == ldc) {
2014-06-29 04:57:07 +00:00
index = code->body()[ip++];
2007-12-09 22:45:43 +00:00
} else {
index = codeReadInt16(t, code, ip);
}
2007-09-30 15:52:21 +00:00
2014-06-29 04:57:07 +00:00
GcSingleton* pool = code->pool();
2007-09-30 15:52:21 +00:00
2007-12-09 22:45:43 +00:00
if (singletonIsObject(t, pool, index - 1)) {
object v = singletonObject(t, pool, index - 1);
2014-05-02 04:50:29 +00:00
loadMemoryBarrier();
2014-05-29 04:17:25 +00:00
if (objectClass(t, v) == type(t, GcReference::Type)) {
2014-06-29 04:57:07 +00:00
GcReference* reference = cast<GcReference>(t, v);
PROTECT(t, reference);
v = resolveClassInPool(t, context->method, index - 1, false);
if (UNLIKELY(v == 0)) {
frame->push(
2014-06-01 20:22:14 +00:00
ir::Type::object(),
c->nativeCall(
c->constant(getThunk(t, getJClassFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
2014-06-01 20:22:14 +00:00
ir::Type::object(),
args(c->threadRegister(),
2014-07-17 00:07:56 +00:00
frame->append(
makePair(t, context->method, reference)))));
}
}
2007-09-30 15:52:21 +00:00
if (v) {
2014-05-29 04:17:25 +00:00
if (objectClass(t, v) == type(t, GcClass::Type)) {
2014-07-17 00:07:56 +00:00
frame->push(
ir::Type::object(),
c->nativeCall(c->constant(getThunk(t, getJClass64Thunk),
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::object(),
args(c->threadRegister(), frame->append(v))));
} else {
frame->push(ir::Type::object(), frame->append(v));
}
}
2007-12-09 22:45:43 +00:00
} else {
ir::Type type = singletonBit(t, pool, poolSize(t, pool), index - 1)
2014-06-01 20:22:14 +00:00
? ir::Type::f4()
: ir::Type::i4();
frame->push(type,
c->constant(singletonValue(t, pool, index - 1), type));
2007-12-09 22:45:43 +00:00
}
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case ldc2_w: {
uint16_t index = codeReadInt16(t, code, ip);
2014-06-29 04:57:07 +00:00
GcSingleton* pool = code->pool();
2007-12-09 22:45:43 +00:00
uint64_t v;
memcpy(&v, &singletonValue(t, pool, index - 1), 8);
ir::Type type = singletonBit(t, pool, poolSize(t, pool), index - 1)
2014-06-01 20:22:14 +00:00
? ir::Type::f8()
: ir::Type::i8();
frame->pushLarge(type, c->constant(v, type));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case ldiv_: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::i8());
ir::Value* b = frame->popLarge(ir::Type::i8());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
c->binaryOp(lir::Divide, ir::Type::i8(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case lload:
2014-06-29 04:57:07 +00:00
frame->loadLarge(ir::Type::i8(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case dload:
2014-06-29 04:57:07 +00:00
frame->loadLarge(ir::Type::f8(), code->body()[ip++]);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case lload_0:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::i8(), 0);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case dload_0:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::f8(), 0);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case lload_1:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::i8(), 1);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case dload_1:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::f8(), 1);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case lload_2:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::i8(), 2);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case dload_2:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::f8(), 2);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case lload_3:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::i8(), 3);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 15:01:57 +00:00
case dload_3:
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::f8(), 3);
2014-05-02 15:01:57 +00:00
break;
2007-12-09 22:45:43 +00:00
case lneg:
2014-06-01 20:22:14 +00:00
frame->pushLarge(
ir::Type::i8(),
c->unaryOp(lir::Negate, frame->popLarge(ir::Type::i8())));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case lookupswitch: {
int32_t base = ip - 1;
2014-07-11 15:50:18 +00:00
ip = (ip + 3) & ~3; // pad to four byte boundary
2014-06-01 20:22:14 +00:00
ir::Value* key = frame->pop(ir::Type::i4());
2014-05-01 18:44:42 +00:00
2007-12-09 22:45:43 +00:00
uint32_t defaultIp = base + codeReadInt32(t, code, ip);
2014-06-29 04:57:07 +00:00
assertT(t, defaultIp < code->length());
2007-12-09 22:45:43 +00:00
int32_t pairCount = codeReadInt32(t, code, ip);
if (pairCount) {
2014-05-01 18:44:42 +00:00
ir::Value* default_ = frame->addressOperand(
frame->addressPromise(frame->machineIp(defaultIp)));
avian::codegen::Promise* start = 0;
2014-07-11 15:50:18 +00:00
uint32_t* ipTable
= static_cast<uint32_t*>(stack.push(sizeof(uint32_t) * pairCount));
for (int32_t i = 0; i < pairCount; ++i) {
unsigned index = ip + (i * 8);
int32_t key = codeReadInt32(t, code, index);
uint32_t newIp = base + codeReadInt32(t, code, index);
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2012-10-13 19:09:24 +00:00
ipTable[i] = newIp;
avian::codegen::Promise* p = c->poolAppend(key);
if (i == 0) {
start = p;
}
c->poolAppendPromise(frame->addressPromise(frame->machineIp(newIp)));
2007-12-09 22:45:43 +00:00
}
assertT(t, start);
ir::Value* address = c->nativeCall(
2014-06-01 20:22:14 +00:00
c->constant(getThunk(t, lookUpAddressThunk), ir::Type::iptr()),
0,
0,
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
args(key,
frame->absoluteAddressOperand(start),
c->constant(pairCount, ir::Type::i4()),
default_));
c->jmp(context->bootContext
? c->binaryOp(lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
c->memory(c->threadRegister(),
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
TARGET_THREAD_CODEIMAGE),
address)
: address);
2007-12-16 00:24:15 +00:00
2014-07-11 15:50:18 +00:00
new (stack.push(sizeof(SwitchState)))
SwitchState(c->saveState(), pairCount, defaultIp, 0, 0, 0, 0);
goto switchloop;
} else {
// a switch statement with no cases, apparently
c->jmp(frame->machineIpValue(defaultIp));
ip = defaultIp;
2007-12-16 00:24:15 +00:00
}
2008-01-07 14:51:07 +00:00
} break;
2007-12-09 22:45:43 +00:00
case lrem: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->popLarge(ir::Type::i8());
ir::Value* b = frame->popLarge(ir::Type::i8());
if (inTryBlock(t, code, ip - 1)) {
c->saveLocals();
frame->trace(0, 0);
}
2014-06-01 20:22:14 +00:00
frame->pushLarge(ir::Type::i8(),
c->binaryOp(lir::Remainder, ir::Type::i8(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2014-05-01 02:01:14 +00:00
case lreturn: {
handleExit(t, frame);
2014-06-01 20:22:14 +00:00
c->return_(frame->popLarge(ir::Type::i8()));
2014-05-01 02:01:14 +00:00
}
goto next;
case dreturn: {
handleExit(t, frame);
2014-06-01 20:22:14 +00:00
c->return_(frame->popLarge(ir::Type::f8()));
2014-07-11 15:50:18 +00:00
}
goto next;
case lshl:
case lshr:
case lushr: {
2014-06-01 20:22:14 +00:00
ir::Value* a = frame->pop(ir::Type::i4());
ir::Value* b = frame->popLarge(ir::Type::i8());
frame->pushLarge(
2014-06-01 20:22:14 +00:00
ir::Type::i8(),
c->binaryOp(
toCompilerBinaryOp(t, instruction), ir::Type::i8(), a, b));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case lstore:
2014-06-29 04:57:07 +00:00
frame->storeLarge(ir::Type::i8(), code->body()[ip++]);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case dstore:
2014-06-29 04:57:07 +00:00
frame->storeLarge(ir::Type::f8(), code->body()[ip++]);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case lstore_0:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::i8(), 0);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case dstore_0:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::f8(), 0);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case lstore_1:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::i8(), 1);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case dstore_1:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::f8(), 1);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case lstore_2:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::i8(), 2);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case dstore_2:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::f8(), 2);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case lstore_3:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::i8(), 3);
2007-12-09 22:45:43 +00:00
break;
2014-05-02 16:05:19 +00:00
case dstore_3:
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::f8(), 3);
2014-05-02 16:05:19 +00:00
break;
2007-12-09 22:45:43 +00:00
case monitorenter: {
2014-06-01 20:22:14 +00:00
ir::Value* target = frame->pop(ir::Type::object());
c->nativeCall(c->constant(getThunk(t, acquireMonitorForObjectThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), target));
2007-12-09 22:45:43 +00:00
} break;
2007-09-29 21:08:29 +00:00
2007-12-09 22:45:43 +00:00
case monitorexit: {
2014-06-01 20:22:14 +00:00
ir::Value* target = frame->pop(ir::Type::object());
c->nativeCall(c->constant(getThunk(t, releaseMonitorForObjectThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), target));
2007-12-09 22:45:43 +00:00
} break;
2007-09-29 21:08:29 +00:00
2007-12-09 22:45:43 +00:00
case multianewarray: {
uint16_t index = codeReadInt16(t, code, ip);
2014-06-29 04:57:07 +00:00
uint8_t dimensions = code->body()[ip++];
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClassInPool(t, context->method, index - 1, false);
object argument;
Thunk thunk;
if (LIKELY(class_)) {
argument = class_;
thunk = makeMultidimensionalArrayThunk;
} else {
argument = makePair(t, context->method, reference);
thunk = makeMultidimensionalArrayFromReferenceThunk;
}
unsigned offset
2014-07-11 15:50:18 +00:00
= localOffset(t,
localSize(t, context->method) + c->topOfStack(),
context->method) + t->arch->frameReturnAddressSize();
2008-11-11 00:07:44 +00:00
2014-05-01 18:44:42 +00:00
ir::Value* result
= c->nativeCall(c->constant(getThunk(t, thunk), ir::Type::iptr()),
2014-07-17 00:07:56 +00:00
0,
frame->trace(0, 0),
ir::Type::object(),
args(c->threadRegister(),
frame->append(argument),
c->constant(dimensions, ir::Type::i4()),
c->constant(offset, ir::Type::i4())));
2014-06-01 20:22:14 +00:00
frame->popFootprint(dimensions);
frame->push(ir::Type::object(), result);
2007-12-09 22:45:43 +00:00
} break;
2007-10-12 00:30:46 +00:00
2007-12-09 22:45:43 +00:00
case new_: {
uint16_t index = codeReadInt16(t, code, ip);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
2007-12-09 22:45:43 +00:00
PROTECT(t, reference);
2014-07-11 15:47:57 +00:00
GcClass* class_
= resolveClassInPool(t, context->method, index - 1, false);
object argument;
Thunk thunk;
if (LIKELY(class_)) {
argument = class_;
2014-05-29 04:17:25 +00:00
if (class_->vmFlags() & (WeakReferenceFlag | HasFinalizerFlag)) {
thunk = makeNewGeneral64Thunk;
} else {
thunk = makeNew64Thunk;
}
2007-12-09 22:45:43 +00:00
} else {
2014-07-11 15:47:57 +00:00
argument = makePair(t, context->method, reference);
thunk = makeNewFromReferenceThunk;
2007-12-09 22:45:43 +00:00
}
2014-07-17 00:07:56 +00:00
frame->push(
ir::Type::object(),
c->nativeCall(c->constant(getThunk(t, thunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::object(),
args(c->threadRegister(), frame->append(argument))));
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case newarray: {
2014-06-29 04:57:07 +00:00
uint8_t type = code->body()[ip++];
2014-06-01 20:22:14 +00:00
ir::Value* length = frame->pop(ir::Type::i4());
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::object(),
c->nativeCall(c->constant(getThunk(t, makeBlankArrayThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::object(),
args(c->threadRegister(),
c->constant(type, ir::Type::i4()),
length)));
2007-12-09 22:45:43 +00:00
} break;
2014-07-11 15:50:18 +00:00
case nop:
break;
2007-12-09 22:45:43 +00:00
case pop_:
2014-06-01 20:22:14 +00:00
frame->popFootprint(1);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case pop2:
2014-06-01 20:22:14 +00:00
frame->popFootprint(2);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case putfield:
case putstatic: {
uint16_t index = codeReadInt16(t, code, ip);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
object reference
= singletonObject(t, context->method->code()->pool(), index - 1);
PROTECT(t, reference);
2014-06-29 04:57:07 +00:00
GcField* field = resolveField(t, context->method, index - 1, false);
if (LIKELY(field)) {
2014-06-29 04:57:07 +00:00
int fieldCode = field->code();
object staticTable = 0;
if (instruction == putstatic) {
checkField(t, field, true);
2014-06-29 04:57:07 +00:00
if (classNeedsInit(t, field->class_())) {
PROTECT(t, field);
2007-10-12 22:06:33 +00:00
c->nativeCall(
2014-06-01 20:22:14 +00:00
c->constant(getThunk(t, tryInitClassThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(field->class_())));
}
staticTable = field->class_()->staticTable();
} else {
checkField(t, field, false);
if (inTryBlock(t, code, ip - 3)) {
c->saveLocals();
frame->trace(0, 0);
}
}
2014-06-29 04:57:07 +00:00
if (field->flags() & ACC_VOLATILE) {
if (TargetBytesPerWord == 4
2014-07-11 15:50:18 +00:00
and (fieldCode == DoubleField or fieldCode == LongField)) {
PROTECT(t, field);
c->nativeCall(c->constant(getThunk(t, acquireMonitorForObjectThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), frame->append(field)));
} else {
c->nullaryOp(lir::StoreStoreBarrier);
}
}
2014-05-01 18:44:42 +00:00
ir::Value* value = popField(t, frame, fieldCode);
2014-05-01 18:44:42 +00:00
ir::Value* table;
if (instruction == putstatic) {
PROTECT(t, field);
table = frame->append(staticTable);
} else {
2014-06-01 20:22:14 +00:00
table = frame->pop(ir::Type::object());
}
switch (fieldCode) {
case ByteField:
case BooleanField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::i1(), targetFieldOffset(context, field)));
break;
case CharField:
case ShortField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::i2(), targetFieldOffset(context, field)));
break;
2014-05-02 15:01:57 +00:00
case FloatField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::f4(), targetFieldOffset(context, field)));
break;
case IntField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::i4(), targetFieldOffset(context, field)));
break;
case DoubleField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::f8(), targetFieldOffset(context, field)));
break;
case LongField:
c->store(
value,
2014-06-01 20:22:14 +00:00
c->memory(
table, ir::Type::i8(), targetFieldOffset(context, field)));
break;
case ObjectField:
if (instruction == putfield) {
c->nativeCall(
2014-06-01 20:22:14 +00:00
c->constant(getThunk(t, setMaybeNullThunk), ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(),
2014-07-17 00:07:56 +00:00
table,
c->constant(targetFieldOffset(context, field),
ir::Type::i4()),
value));
} else {
c->nativeCall(
2014-06-28 20:41:27 +00:00
c->constant(getThunk(t, setObjectThunk), ir::Type::iptr()),
2014-06-01 20:22:14 +00:00
0,
0,
ir::Type::void_(),
args(c->threadRegister(),
2014-07-17 00:07:56 +00:00
table,
c->constant(targetFieldOffset(context, field),
ir::Type::i4()),
value));
}
break;
2014-07-11 15:50:18 +00:00
default:
abort(t);
2007-12-30 22:24:48 +00:00
}
2014-06-29 04:57:07 +00:00
if (field->flags() & ACC_VOLATILE) {
if (TargetBytesPerWord == 4
2014-07-11 15:50:18 +00:00
and (fieldCode == DoubleField or fieldCode == LongField)) {
c->nativeCall(c->constant(getThunk(t, releaseMonitorForObjectThunk),
2014-07-17 00:07:56 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
ir::Type::void_(),
args(c->threadRegister(), frame->append(field)));
} else {
c->nullaryOp(lir::StoreLoadBarrier);
}
}
} else {
2014-06-29 04:57:07 +00:00
GcReference* ref = cast<GcReference>(t, reference);
PROTECT(t, ref);
2014-07-11 15:47:57 +00:00
int fieldCode = vm::fieldCode(t, ref->spec()->body()[0]);
2014-05-01 18:44:42 +00:00
ir::Value* value = popField(t, frame, fieldCode);
ir::Type rType = operandTypeForFieldCode(t, fieldCode);
GcPair* pair = makePair(t, context->method, reference);
switch (fieldCode) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case FloatField:
case IntField: {
if (instruction == putstatic) {
c->nativeCall(
c->constant(getThunk(t, setStaticFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(pair), value));
} else {
2014-06-01 20:22:14 +00:00
ir::Value* instance = frame->pop(ir::Type::object());
2014-07-17 00:07:56 +00:00
c->nativeCall(
c->constant(getThunk(t, setFieldValueFromReferenceThunk),
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
args(
c->threadRegister(), frame->append(pair), instance, value));
}
} break;
case DoubleField:
case LongField: {
if (instruction == putstatic) {
2014-07-17 00:07:56 +00:00
c->nativeCall(
c->constant(
getThunk(t, setStaticLongFieldValueFromReferenceThunk),
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
args(c->threadRegister(), frame->append(pair), nullptr, value));
} else {
2014-06-01 20:22:14 +00:00
ir::Value* instance = frame->pop(ir::Type::object());
c->nativeCall(
c->constant(getThunk(t, setLongFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
args(c->threadRegister(),
2014-07-17 00:07:56 +00:00
frame->append(pair),
instance,
nullptr,
value));
}
} break;
case ObjectField: {
if (instruction == putstatic) {
c->nativeCall(
c->constant(
getThunk(t, setStaticObjectFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
2014-07-17 00:07:56 +00:00
args(c->threadRegister(), frame->append(pair), value));
} else {
2014-06-01 20:22:14 +00:00
ir::Value* instance = frame->pop(ir::Type::object());
c->nativeCall(
c->constant(getThunk(t, setObjectFieldValueFromReferenceThunk),
2014-06-01 20:22:14 +00:00
ir::Type::iptr()),
0,
frame->trace(0, 0),
rType,
2014-07-17 00:07:56 +00:00
args(
c->threadRegister(), frame->append(pair), instance, value));
}
} break;
2009-03-03 03:18:15 +00:00
2014-07-11 15:50:18 +00:00
default:
abort(t);
}
2009-03-03 03:18:15 +00:00
}
2007-12-09 22:45:43 +00:00
} break;
case ret: {
2014-06-29 04:57:07 +00:00
unsigned index = code->body()[ip];
unsigned returnAddress = frame->endSubroutine(index);
c->jmp(frame->machineIpValue(returnAddress));
ip = returnAddress;
} break;
2007-12-09 22:45:43 +00:00
case return_:
if (needsReturnBarrier(t, context->method)) {
c->nullaryOp(lir::StoreStoreBarrier);
}
handleExit(t, frame);
2014-05-01 02:01:14 +00:00
c->return_();
goto next;
2007-12-09 22:45:43 +00:00
case sipush:
2014-06-01 20:22:14 +00:00
frame->push(ir::Type::i4(),
c->constant(static_cast<int16_t>(codeReadInt16(t, code, ip)),
2014-06-01 20:22:14 +00:00
ir::Type::i4()));
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case swap:
frame->swap();
break;
2007-12-09 22:45:43 +00:00
case tableswitch: {
int32_t base = ip - 1;
2014-07-11 15:50:18 +00:00
ip = (ip + 3) & ~3; // pad to four byte boundary
2007-09-30 02:48:27 +00:00
2007-12-09 22:45:43 +00:00
uint32_t defaultIp = base + codeReadInt32(t, code, ip);
2014-06-29 04:57:07 +00:00
assertT(t, defaultIp < code->length());
2014-05-29 04:17:25 +00:00
2007-12-09 22:45:43 +00:00
int32_t bottom = codeReadInt32(t, code, ip);
int32_t top = codeReadInt32(t, code, ip);
2014-05-29 04:17:25 +00:00
avian::codegen::Promise* start = 0;
unsigned count = top - bottom + 1;
2014-07-11 15:50:18 +00:00
uint32_t* ipTable
= static_cast<uint32_t*>(stack.push(sizeof(uint32_t) * count));
2007-12-16 00:24:15 +00:00
for (int32_t i = 0; i < top - bottom + 1; ++i) {
2007-12-09 22:45:43 +00:00
unsigned index = ip + (i * 4);
uint32_t newIp = base + codeReadInt32(t, code, index);
2014-06-29 04:57:07 +00:00
assertT(t, newIp < code->length());
2012-10-13 19:09:24 +00:00
ipTable[i] = newIp;
2007-12-16 00:24:15 +00:00
avian::codegen::Promise* p = c->poolAppendPromise(
frame->addressPromise(frame->machineIp(newIp)));
2007-12-09 22:45:43 +00:00
if (i == 0) {
start = p;
}
2007-12-09 22:45:43 +00:00
}
assertT(t, start);
2014-06-01 20:22:14 +00:00
ir::Value* key = frame->pop(ir::Type::i4());
c->condJump(lir::JumpIfLess,
2014-06-01 20:22:14 +00:00
c->constant(bottom, ir::Type::i4()),
key,
frame->machineIpValue(defaultIp));
2008-09-20 23:42:46 +00:00
2014-06-01 20:22:14 +00:00
c->save(ir::Type::i4(), key);
2014-07-11 15:50:18 +00:00
new (stack.push(sizeof(SwitchState))) SwitchState(
c->saveState(), count, defaultIp, key, start, bottom, top);
2007-12-16 00:24:15 +00:00
stack.pushValue(Untable0);
2008-01-07 14:51:07 +00:00
ip = defaultIp;
2014-07-11 15:50:18 +00:00
}
goto start;
2007-12-09 22:45:43 +00:00
case wide: {
2014-06-29 04:57:07 +00:00
switch (code->body()[ip++]) {
2007-12-09 22:45:43 +00:00
case aload: {
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::object(), codeReadInt16(t, code, ip));
2007-10-04 22:41:19 +00:00
} break;
2007-12-09 22:45:43 +00:00
case astore: {
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::object(), codeReadInt16(t, code, ip));
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case iinc: {
uint16_t index = codeReadInt16(t, code, ip);
int16_t count = codeReadInt16(t, code, ip);
2007-10-04 22:41:19 +00:00
storeLocal(context,
1,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
c->binaryOp(lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::i4(),
c->constant(count, ir::Type::i4()),
loadLocal(context, 1, ir::Type::i4(), index)),
index);
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case iload: {
2014-06-01 20:22:14 +00:00
frame->load(ir::Type::i4(), codeReadInt16(t, code, ip));
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case istore: {
2014-06-01 20:22:14 +00:00
frame->store(ir::Type::i4(), codeReadInt16(t, code, ip));
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case lload: {
2014-06-01 20:22:14 +00:00
frame->loadLarge(ir::Type::i8(), codeReadInt16(t, code, ip));
2007-12-09 22:45:43 +00:00
} break;
2007-10-04 22:41:19 +00:00
2007-12-09 22:45:43 +00:00
case lstore: {
2014-06-01 20:22:14 +00:00
frame->storeLarge(ir::Type::i8(), codeReadInt16(t, code, ip));
2007-12-09 22:45:43 +00:00
} break;
2007-10-12 14:26:36 +00:00
case ret: {
unsigned index = codeReadInt16(t, code, ip);
unsigned returnAddress = frame->endSubroutine(index);
c->jmp(frame->machineIpValue(returnAddress));
ip = returnAddress;
} break;
2007-10-04 22:41:19 +00:00
2014-07-11 15:50:18 +00:00
default:
abort(t);
2007-12-09 22:45:43 +00:00
}
} break;
2014-07-11 15:50:18 +00:00
default:
abort(t);
2007-12-09 22:45:43 +00:00
}
}
2014-07-11 15:50:18 +00:00
next:
frame->dispose();
frame = 0;
stack.pop(sizeof(Frame));
2014-05-05 16:49:50 +00:00
stack.pop(stackSize * sizeof(ir::Type));
switch (stack.popValue()) {
case Return:
return;
case Unbranch:
if (DebugInstructions) {
fprintf(stderr, "Unbranch\n");
}
ip = stack.popValue();
c->restoreState(reinterpret_cast<Compiler::State*>(stack.popValue()));
frame = static_cast<Frame*>(stack.peek(sizeof(Frame)));
goto loop;
case Untable0: {
if (DebugInstructions) {
fprintf(stderr, "Untable0\n");
}
2014-07-11 15:50:18 +00:00
SwitchState* s = static_cast<SwitchState*>(stack.peek(sizeof(SwitchState)));
frame = s->frame();
c->restoreState(s->state);
c->condJump(lir::JumpIfGreater,
2014-06-01 20:22:14 +00:00
c->constant(s->top, ir::Type::i4()),
s->key,
frame->machineIpValue(s->defaultIp));
2014-05-01 02:20:19 +00:00
2014-06-01 20:22:14 +00:00
c->save(ir::Type::i4(), s->key);
ip = s->defaultIp;
stack.pushValue(Untable1);
2014-07-11 15:50:18 +00:00
}
goto start;
case Untable1: {
if (DebugInstructions) {
fprintf(stderr, "Untable1\n");
}
2014-07-11 15:50:18 +00:00
SwitchState* s = static_cast<SwitchState*>(stack.peek(sizeof(SwitchState)));
frame = s->frame();
c->restoreState(s->state);
2014-05-01 18:44:42 +00:00
ir::Value* normalizedKey
2014-06-01 20:22:14 +00:00
= (s->bottom
? c->binaryOp(lir::Subtract,
ir::Type::i4(),
c->constant(s->bottom, ir::Type::i4()),
s->key)
: s->key);
2014-05-01 18:44:42 +00:00
ir::Value* entry = c->memory(frame->absoluteAddressOperand(s->start),
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
2014-05-01 18:44:42 +00:00
0,
normalizedKey);
2014-07-12 17:54:19 +00:00
c->jmp(c->load(ir::ExtendMode::Signed,
context->bootContext
? c->binaryOp(lir::Add,
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
c->memory(c->threadRegister(),
2014-06-01 20:22:14 +00:00
ir::Type::iptr(),
TARGET_THREAD_CODEIMAGE),
entry)
: entry,
2014-06-01 20:22:14 +00:00
ir::Type::iptr()));
s->state = c->saveState();
2014-07-11 15:50:18 +00:00
}
goto switchloop;
case Unswitch: {
if (DebugInstructions) {
fprintf(stderr, "Unswitch\n");
}
2014-07-11 15:50:18 +00:00
SwitchState* s = static_cast<SwitchState*>(stack.peek(sizeof(SwitchState)));
frame = s->frame();
2014-07-11 15:50:18 +00:00
c->restoreState(
static_cast<SwitchState*>(stack.peek(sizeof(SwitchState)))->state);
}
goto switchloop;
case Unsubroutine: {
if (DebugInstructions) {
fprintf(stderr, "Unsubroutine\n");
}
ip = stack.popValue();
unsigned start = stack.popValue();
frame = reinterpret_cast<Frame*>(stack.peek(sizeof(Frame)));
frame->endSubroutine(start);
2014-07-11 15:50:18 +00:00
}
goto loop;
default:
abort(t);
}
2014-07-11 15:50:18 +00:00
switchloop : {
SwitchState* s = static_cast<SwitchState*>(stack.peek(sizeof(SwitchState)));
2014-07-11 15:50:18 +00:00
if (s->index < s->count) {
ip = s->ipTable()[s->index++];
stack.pushValue(Unswitch);
goto start;
} else {
ip = s->defaultIp;
unsigned count = s->count * 4;
stack.pop(sizeof(SwitchState));
stack.pop(count);
frame = reinterpret_cast<Frame*>(stack.peek(sizeof(Frame)));
goto loop;
}
2014-07-11 15:50:18 +00:00
}
2014-07-11 15:50:18 +00:00
branch:
stack.pushValue(reinterpret_cast<uintptr_t>(c->saveState()));
stack.pushValue(ip);
stack.pushValue(Unbranch);
ip = newIp;
goto start;
2007-12-09 22:45:43 +00:00
}
2007-10-04 22:41:19 +00:00
2014-07-11 15:50:18 +00:00
int resolveIpForwards(Context* context, int start, int end)
{
if (start < 0) {
start = 0;
}
while (start < end and context->visitTable[start] == 0) {
2014-07-11 15:50:18 +00:00
++start;
}
2014-05-29 04:17:25 +00:00
if (start >= end) {
return -1;
} else {
return start;
}
}
2014-07-11 15:50:18 +00:00
int resolveIpBackwards(Context* context, int start, int end)
{
2014-06-28 04:00:05 +00:00
if (start >= static_cast<int>(context->method->code()->length()
* (context->subroutineCount + 1))) {
2014-06-28 04:00:05 +00:00
start = context->method->code()->length();
} else {
while (start >= end and context->visitTable[start] == 0) {
2014-07-11 15:50:18 +00:00
--start;
}
}
2014-05-29 04:17:25 +00:00
if (start < end) {
return -1;
} else {
return start;
}
}
2014-07-11 15:47:57 +00:00
GcIntArray* truncateIntArray(Thread* t, GcIntArray* array, unsigned length)
{
2014-06-29 04:57:07 +00:00
expect(t, array->length() > length);
PROTECT(t, array);
2014-06-29 04:57:07 +00:00
GcIntArray* newArray = makeIntArray(t, length);
if (length) {
2014-07-11 15:47:57 +00:00
memcpy(newArray->body().begin(), array->body().begin(), length * 4);
}
return newArray;
}
2014-07-11 15:47:57 +00:00
GcArray* truncateArray(Thread* t, GcArray* array, unsigned length)
{
2014-06-29 04:57:07 +00:00
expect(t, array->length() > length);
PROTECT(t, array);
2014-06-29 04:57:07 +00:00
GcArray* newArray = makeArray(t, length);
if (length) {
2014-07-11 15:47:57 +00:00
for (size_t i = 0; i < length; i++) {
2014-06-25 20:38:13 +00:00
newArray->setBodyElement(t, i, array->body()[i]);
}
}
return newArray;
}
2014-07-11 15:47:57 +00:00
GcLineNumberTable* truncateLineNumberTable(Thread* t,
GcLineNumberTable* table,
unsigned length)
{
2014-06-29 04:57:07 +00:00
expect(t, table->length() > length);
PROTECT(t, table);
2014-06-29 04:57:07 +00:00
GcLineNumberTable* newTable = makeLineNumberTable(t, length);
if (length) {
2014-06-29 04:57:07 +00:00
memcpy(newTable->body().begin(),
table->body().begin(),
length * sizeof(uint64_t));
}
return newTable;
}
2014-06-29 04:57:07 +00:00
GcArray* translateExceptionHandlerTable(MyThread* t,
2014-07-11 15:47:57 +00:00
Context* context,
intptr_t start,
intptr_t end)
2008-01-07 14:51:07 +00:00
{
avian::codegen::Compiler* c = context->compiler;
2014-07-11 15:47:57 +00:00
GcExceptionHandlerTable* oldTable = cast<GcExceptionHandlerTable>(
t, context->method->code()->exceptionHandlerTable());
2008-01-07 14:51:07 +00:00
if (oldTable) {
PROTECT(t, oldTable);
2014-06-29 04:57:07 +00:00
unsigned length = oldTable->length();
2014-06-29 04:57:07 +00:00
GcIntArray* newIndex
= makeIntArray(t, length * (context->subroutineCount + 1) * 3);
PROTECT(t, newIndex);
2014-07-11 15:47:57 +00:00
GcArray* newTable
= makeArray(t, length * (context->subroutineCount + 1) + 1);
PROTECT(t, newTable);
unsigned ni = 0;
for (unsigned subI = 0; subI <= context->subroutineCount; ++subI) {
2014-07-11 15:47:57 +00:00
unsigned duplicatedBaseIp = subI * context->method->code()->length();
for (unsigned oi = 0; oi < length; ++oi) {
2014-06-29 04:57:07 +00:00
uint64_t oldHandler = oldTable->body()[oi];
int handlerStart = resolveIpForwards(
context,
duplicatedBaseIp + exceptionHandlerStart(oldHandler),
duplicatedBaseIp + exceptionHandlerEnd(oldHandler));
if (LIKELY(handlerStart >= 0)) {
2014-07-11 15:47:57 +00:00
assertT(t,
handlerStart
< static_cast<int>(context->method->code()->length()
* (context->subroutineCount + 1)));
int handlerEnd = resolveIpBackwards(
context,
duplicatedBaseIp + exceptionHandlerEnd(oldHandler),
duplicatedBaseIp + exceptionHandlerStart(oldHandler));
assertT(t, handlerEnd >= 0);
2014-07-11 15:47:57 +00:00
assertT(
t,
handlerEnd <= static_cast<int>(context->method->code()->length()
* (context->subroutineCount + 1)));
2014-07-11 15:47:57 +00:00
newIndex->body()[ni * 3] = c->machineIp(handlerStart)->value()
- start;
2014-07-11 15:47:57 +00:00
newIndex->body()[(ni * 3) + 1]
= (handlerEnd
== static_cast<int>(context->method->code()->length())
? end
: c->machineIp(handlerEnd)->value()) - start;
2014-07-11 15:47:57 +00:00
newIndex->body()[(ni * 3) + 2]
= c->machineIp(exceptionHandlerIp(oldHandler))->value() - start;
object type;
if (exceptionHandlerCatchType(oldHandler)) {
type = resolveClassInPool(
t, context->method, exceptionHandlerCatchType(oldHandler) - 1);
} else {
type = 0;
}
2014-06-25 20:38:13 +00:00
newTable->setBodyElement(t, ni + 1, type);
++ni;
}
}
}
if (UNLIKELY(ni < length)) {
newIndex = truncateIntArray(t, newIndex, ni * 3);
newTable = truncateArray(t, newTable, ni + 1);
2008-01-07 14:51:07 +00:00
}
newTable->setBodyElement(t, 0, newIndex);
return newTable;
} else {
return 0;
2008-01-07 14:51:07 +00:00
}
}
2014-07-11 15:47:57 +00:00
GcLineNumberTable* translateLineNumberTable(MyThread* t,
Context* context,
intptr_t start)
2008-01-07 14:51:07 +00:00
{
2014-06-29 04:57:07 +00:00
GcLineNumberTable* oldTable = context->method->code()->lineNumberTable();
2008-01-07 14:51:07 +00:00
if (oldTable) {
PROTECT(t, oldTable);
2014-06-29 04:57:07 +00:00
unsigned length = oldTable->length();
GcLineNumberTable* newTable = makeLineNumberTable(t, length);
unsigned ni = 0;
for (unsigned oi = 0; oi < length; ++oi) {
2014-06-29 04:57:07 +00:00
uint64_t oldLine = oldTable->body()[oi];
2014-07-11 15:47:57 +00:00
int ip = resolveIpForwards(
context,
lineNumberIp(oldLine),
oi + 1 < length ? lineNumberIp(oldTable->body()[oi + 1]) - 1
: lineNumberIp(oldLine) + 1);
2008-01-07 14:51:07 +00:00
if (LIKELY(ip >= 0)) {
2014-07-11 15:47:57 +00:00
newTable->body()[ni++]
= lineNumber(context->compiler->machineIp(ip)->value() - start,
lineNumberLine(oldLine));
}
}
2008-01-07 14:51:07 +00:00
if (UNLIKELY(ni < length)) {
newTable = truncateLineNumberTable(t, newTable, ni);
2008-01-07 14:51:07 +00:00
}
return newTable;
} else {
return 0;
2008-01-07 14:51:07 +00:00
}
}
2014-07-11 15:50:18 +00:00
void printSet(uintptr_t* m, unsigned limit)
{
if (limit) {
for (unsigned i = 0; i < 32; ++i) {
if ((*m >> i) & 1) {
fprintf(stderr, "1");
} else {
fprintf(stderr, "_");
}
}
}
}
2014-07-11 15:50:18 +00:00
void calculateTryCatchRoots(Context* context,
uintptr_t* roots,
unsigned mapSize,
unsigned start,
unsigned end)
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
{
memset(roots, 0xFF, mapSize * BytesPerWord);
if (DebugFrameMaps) {
fprintf(stderr, "calculate try/catch roots from %d to %d\n", start, end);
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
}
for (TraceElement* te = context->traceLog; te; te = te->next) {
if (te->ip >= start and te->ip < end) {
uintptr_t* traceRoots = 0;
traceRoots = te->map;
te->watch = true;
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
if (traceRoots) {
if (DebugFrameMaps) {
fprintf(stderr, " use roots at ip %3d: ", te->ip);
printSet(traceRoots, mapSize);
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, "\n");
}
for (unsigned wi = 0; wi < mapSize; ++wi) {
roots[wi] &= traceRoots[wi];
}
} else {
if (DebugFrameMaps) {
fprintf(stderr, " skip roots at ip %3d\n", te->ip);
}
}
}
}
if (DebugFrameMaps) {
fprintf(stderr, "result roots : ");
printSet(roots, mapSize);
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, "\n");
}
}
unsigned calculateFrameMaps(MyThread* t,
Context* context,
uintptr_t* originalRoots,
unsigned eventIndex,
uintptr_t* resultRoots)
2008-01-07 14:51:07 +00:00
{
// for each instruction with more than one predecessor, and for each
// stack position, determine if there exists a path to that
// instruction such that there is not an object pointer left at that
// stack position (i.e. it is uninitialized or contains primitive
// data).
2008-01-07 14:51:07 +00:00
unsigned mapSize = frameMapSizeInWords(t, context->method);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, roots, mapSize);
if (originalRoots) {
memcpy(RUNTIME_ARRAY_BODY(roots), originalRoots, mapSize * BytesPerWord);
} else {
memset(RUNTIME_ARRAY_BODY(roots), 0, mapSize * BytesPerWord);
}
2008-01-07 14:51:07 +00:00
int32_t ip = -1;
// invariant: for each stack position, roots contains a zero at that
// position if there exists some path to the current instruction
// such that there is definitely not an object pointer at that
// position. Otherwise, roots contains a one at that position,
// meaning either all known paths result in an object pointer at
// that position, or the contents of that position are as yet
// unknown.
unsigned length = context->eventLog.length();
while (eventIndex < length) {
Event e = static_cast<Event>(context->eventLog.get(eventIndex++));
2008-01-07 14:51:07 +00:00
switch (e) {
2008-07-05 20:21:13 +00:00
case PushContextEvent: {
eventIndex = calculateFrameMaps(t,
context,
RUNTIME_ARRAY_BODY(roots),
eventIndex, /*subroutinePath,*/
resultRoots);
2008-01-07 14:51:07 +00:00
} break;
2008-07-05 20:21:13 +00:00
case PopContextEvent:
goto exit;
2008-01-07 14:51:07 +00:00
case IpEvent: {
ip = context->eventLog.get2(eventIndex);
eventIndex += 2;
2008-01-07 14:51:07 +00:00
if (DebugFrameMaps) {
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, " roots at ip %3d: ", ip);
printSet(RUNTIME_ARRAY_BODY(roots), mapSize);
fprintf(stderr, "\n");
}
assertT(context->thread, ip * mapSize <= context->rootTable.count);
uintptr_t* tableRoots = context->rootTable.begin() + (ip * mapSize);
2008-01-07 14:51:07 +00:00
if (context->visitTable[ip] > 1) {
for (unsigned wi = 0; wi < mapSize; ++wi) {
uintptr_t newRoots = tableRoots[wi] & RUNTIME_ARRAY_BODY(roots)[wi];
if ((eventIndex == length
2008-07-05 20:21:13 +00:00
or context->eventLog.get(eventIndex) == PopContextEvent)
2014-07-11 15:50:18 +00:00
and newRoots != tableRoots[wi]) {
if (DebugFrameMaps) {
fprintf(stderr, "dirty roots!\n");
}
context->dirtyRoots = true;
}
tableRoots[wi] = newRoots;
RUNTIME_ARRAY_BODY(roots)[wi] &= tableRoots[wi];
2008-01-07 14:51:07 +00:00
}
if (DebugFrameMaps) {
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, " table roots at ip %3d: ", ip);
printSet(tableRoots, mapSize);
fprintf(stderr, "\n");
}
} else {
memcpy(tableRoots, RUNTIME_ARRAY_BODY(roots), mapSize * BytesPerWord);
2008-01-07 14:51:07 +00:00
}
} break;
case MarkEvent: {
unsigned i = context->eventLog.get2(eventIndex);
eventIndex += 2;
2008-01-07 14:51:07 +00:00
markBit(RUNTIME_ARRAY_BODY(roots), i);
2008-01-07 14:51:07 +00:00
} break;
case ClearEvent: {
unsigned i = context->eventLog.get2(eventIndex);
eventIndex += 2;
clearBit(RUNTIME_ARRAY_BODY(roots), i);
2008-01-07 14:51:07 +00:00
} break;
case PushExceptionHandlerEvent: {
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
unsigned start = context->eventLog.get2(eventIndex);
eventIndex += 2;
unsigned end = context->eventLog.get2(eventIndex);
eventIndex += 2;
calculateTryCatchRoots(
context, RUNTIME_ARRAY_BODY(roots), mapSize, start, end);
eventIndex = calculateFrameMaps(
t, context, RUNTIME_ARRAY_BODY(roots), eventIndex, 0);
} break;
2008-01-07 14:51:07 +00:00
case TraceEvent: {
2014-07-11 15:50:18 +00:00
TraceElement* te;
context->eventLog.get(eventIndex, &te, BytesPerWord);
if (DebugFrameMaps) {
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, " trace roots at ip %3d: ", ip);
printSet(RUNTIME_ARRAY_BODY(roots), mapSize);
fprintf(stderr, "\n");
}
2014-05-29 04:17:25 +00:00
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
uintptr_t* map;
bool watch;
map = te->map;
watch = te->watch;
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
for (unsigned wi = 0; wi < mapSize; ++wi) {
uintptr_t v = RUNTIME_ARRAY_BODY(roots)[wi];
if (watch and map[wi] != v) {
if (DebugFrameMaps) {
fprintf(stderr, "dirty roots due to trace watch!\n");
}
context->dirtyRoots = true;
}
map[wi] = v;
}
eventIndex += BytesPerWord;
2008-01-07 14:51:07 +00:00
} break;
2014-07-11 15:50:18 +00:00
default:
abort(t);
2008-01-07 14:51:07 +00:00
}
}
2014-07-11 15:50:18 +00:00
exit:
if (resultRoots and ip != -1) {
if (DebugFrameMaps) {
fprintf(stderr, "result roots at ip %3d: ", ip);
printSet(RUNTIME_ARRAY_BODY(roots), mapSize);
fprintf(stderr, "\n");
}
memcpy(resultRoots, RUNTIME_ARRAY_BODY(roots), mapSize * BytesPerWord);
}
return eventIndex;
2008-01-07 14:51:07 +00:00
}
2014-07-11 15:50:18 +00:00
int compareTraceElementPointers(const void* va, const void* vb)
{
TraceElement* a = *static_cast<TraceElement* const*>(va);
TraceElement* b = *static_cast<TraceElement* const*>(vb);
if (a->address->value() > b->address->value()) {
return 1;
} else if (a->address->value() < b->address->value()) {
return -1;
} else {
return 0;
}
}
2014-07-11 15:50:18 +00:00
uint8_t* finish(MyThread* t,
FixedAllocator* allocator,
avian::codegen::Assembler* a,
const char* name,
unsigned length)
2008-02-11 17:21:41 +00:00
{
2014-07-11 15:50:18 +00:00
uint8_t* start
= static_cast<uint8_t*>(allocator->allocate(length, TargetBytesPerWord));
2007-10-04 22:41:19 +00:00
a->setDestination(start);
a->write();
2007-10-04 22:41:19 +00:00
logCompile(t, start, length, 0, name, 0);
2007-10-04 22:41:19 +00:00
2008-11-23 23:58:01 +00:00
return start;
2008-02-11 17:21:41 +00:00
}
2007-10-12 14:26:36 +00:00
2014-07-11 15:50:18 +00:00
void setBit(int32_t* dst, unsigned index)
{
dst[index / 32] |= static_cast<int32_t>(1) << (index % 32);
}
2014-07-11 15:50:18 +00:00
void clearBit(int32_t* dst, unsigned index)
{
dst[index / 32] &= ~(static_cast<int32_t>(1) << (index % 32));
}
void copyFrameMap(int32_t* dst,
uintptr_t* src,
unsigned mapSizeInBits,
unsigned offset,
2014-06-01 16:04:56 +00:00
TraceElement* p)
{
if (DebugFrameMaps) {
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, " orig roots at ip %3d: ", p->ip);
2013-02-11 01:06:15 +00:00
printSet(src, ceilingDivide(mapSizeInBits, BitsPerWord));
fprintf(stderr, "\n");
fix stack frame mapping code for exception handlers Previously, the stack frame mapping code (responsible for statically calculating the map of GC roots for a method's stack frame during JIT compilation) would assume that the map of GC roots on entry to an exception handler is the same as on entry to the "try" block which the handler is attached to. Technically, this is true, but the algorithm we use does not consider whether a local variable is still "live" (i.e. will be read later) when calculating the map - only whether we can expect to find a reference there via normal (non-exceptional) control flow. This can backfire if, within a "try" block, the stack location which held an object reference on entry to the block gets overwritten with a non-reference (i.e. a primitive). If an exception is later thrown from such a block, we might end up trying to treat that non-reference as a reference during GC, which will crash the VM. The ideal way to fix this is to calculate the true interval for which each value is live and use that to produce the stack frame maps. This would provide the added benefit of ensuring that the garbage collector does not visit references which, although still present on the stack, will not be used again. However, this commit uses the less invasive strategy of ANDing together the root maps at each GC point within a "try" block and using the result as the map on entry to the corresponding exception handler(s). This should give us safe, if not optimal, results. Later on, we can refine it as described above.
2010-02-05 01:03:32 +00:00
fprintf(stderr, " final roots at ip %3d: ", p->ip);
}
for (unsigned j = 0; j < p->argumentIndex; ++j) {
if (getBit(src, j)) {
if (DebugFrameMaps) {
fprintf(stderr, "1");
}
setBit(dst, offset + j);
} else {
if (DebugFrameMaps) {
fprintf(stderr, "_");
}
clearBit(dst, offset + j);
}
}
if (DebugFrameMaps) {
fprintf(stderr, "\n");
}
}
class FrameMapTableHeader {
public:
2014-07-11 15:50:18 +00:00
FrameMapTableHeader(unsigned indexCount) : indexCount(indexCount)
{
}
unsigned indexCount;
};
class FrameMapTableIndexElement {
public:
2014-07-11 15:50:18 +00:00
FrameMapTableIndexElement(int offset, unsigned base, unsigned path)
: offset(offset), base(base), path(path)
{
}
int offset;
unsigned base;
unsigned path;
};
class FrameMapTablePath {
public:
2014-07-11 15:50:18 +00:00
FrameMapTablePath(unsigned stackIndex, unsigned elementCount, unsigned next)
: stackIndex(stackIndex), elementCount(elementCount), next(next)
{
}
unsigned stackIndex;
unsigned elementCount;
unsigned next;
int32_t elements[0];
};
2014-07-11 15:47:57 +00:00
GcIntArray* makeSimpleFrameMapTable(MyThread* t,
Context* context,
uint8_t* start,
TraceElement** elements,
unsigned elementCount)
{
unsigned mapSize = frameMapSizeInBits(t, context->method);
2014-07-11 15:47:57 +00:00
GcIntArray* table = makeIntArray(
t, elementCount + ceilingDivide(elementCount * mapSize, 32));
2014-07-11 15:47:57 +00:00
assertT(t,
table->length()
== elementCount + simpleFrameMapTableSize(t, context->method, table));
for (unsigned i = 0; i < elementCount; ++i) {
TraceElement* p = elements[i];
2014-06-29 04:57:07 +00:00
table->body()[i] = static_cast<intptr_t>(p->address->value())
2014-07-11 15:47:57 +00:00
- reinterpret_cast<intptr_t>(start);
2014-07-11 15:47:57 +00:00
assertT(
t,
elementCount + ceilingDivide((i + 1) * mapSize, 32) <= table->length());
if (mapSize) {
2014-07-11 15:47:57 +00:00
copyFrameMap(
&table->body()[elementCount], p->map, mapSize, i * mapSize, p);
}
}
return table;
}
2009-10-20 14:20:49 +00:00
void insertCallNode(MyThread* t, GcCallNode* node);
2014-07-11 15:50:18 +00:00
void finish(MyThread* t, FixedAllocator* allocator, Context* context)
2008-02-11 17:21:41 +00:00
{
avian::codegen::Compiler* c = context->compiler;
if (false) {
2014-07-11 15:47:57 +00:00
logCompile(
t,
0,
0,
reinterpret_cast<const char*>(
context->method->class_()->name()->body().begin()),
reinterpret_cast<const char*>(context->method->name()->body().begin()),
reinterpret_cast<const char*>(context->method->spec()->body().begin()));
}
// for debugging:
2014-07-11 15:47:57 +00:00
if (false
and ::strcmp(reinterpret_cast<const char*>(
context->method->class_()->name()->body().begin()),
"java/lang/System") == 0
and ::strcmp(reinterpret_cast<const char*>(
context->method->name()->body().begin()),
"<clinit>") == 0) {
trap();
}
// todo: this is a CPU-intensive operation, so consider doing it
// earlier before we've acquired the global class lock to improve
// parallelism (the downside being that it may end up being a waste
// of cycles if another thread compiles the same method in parallel,
// which might be mitigated by fine-grained, per-method locking):
c->compile(context->leaf ? 0 : stackOverflowThunk(t),
TARGET_THREAD_STACKLIMIT);
// we must acquire the class lock here at the latest
2014-02-25 22:46:35 +00:00
unsigned codeSize = c->resolve(allocator->memory.begin() + allocator->offset);
unsigned total = pad(codeSize, TargetBytesPerWord)
2014-07-11 15:50:18 +00:00
+ pad(c->poolSize(), TargetBytesPerWord);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
2014-07-11 15:50:18 +00:00
target_uintptr_t* code = static_cast<target_uintptr_t*>(
allocator->allocate(total, TargetBytesPerWord));
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
uint8_t* start = reinterpret_cast<uint8_t*>(code);
2008-11-23 23:58:01 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
context->executableAllocator = allocator;
context->executableStart = code;
context->executableSize = total;
2008-11-23 23:58:01 +00:00
if (context->objectPool) {
2014-07-11 15:47:57 +00:00
object pool = allocate3(
t,
allocator,
Machine::ImmortalAllocation,
GcArray::FixedSize + ((context->objectPoolCount + 1) * BytesPerWord),
true);
2008-11-23 23:58:01 +00:00
2014-02-25 22:46:35 +00:00
context->executableSize = (allocator->memory.begin() + allocator->offset)
- static_cast<uint8_t*>(context->executableStart);
2014-07-11 15:47:57 +00:00
initArray(
t, reinterpret_cast<GcArray*>(pool), context->objectPoolCount + 1);
mark(t, pool, 0);
2008-11-23 23:58:01 +00:00
2014-06-26 02:17:27 +00:00
setField(t, pool, ArrayBody, compileRoots(t)->objectPools());
2014-06-25 20:38:13 +00:00
compileRoots(t)->setObjectPools(t, pool);
2008-11-23 23:58:01 +00:00
unsigned i = 1;
for (PoolElement* p = context->objectPool; p; p = p->next) {
unsigned offset = ArrayBody + ((i++) * BytesPerWord);
2008-11-23 23:58:01 +00:00
p->address = reinterpret_cast<uintptr_t>(pool) + offset;
2014-06-26 02:17:27 +00:00
setField(t, pool, offset, p->target);
2008-11-23 23:58:01 +00:00
}
}
c->write();
BootContext* bc = context->bootContext;
if (bc) {
for (avian::codegen::DelayedPromise* p = bc->addresses;
p != bc->addressSentinal;
2014-07-11 15:50:18 +00:00
p = p->next) {
p->basis = new (bc->zone)
avian::codegen::ResolvedPromise(p->basis->value());
}
}
2014-07-11 15:47:57 +00:00
{
GcArray* newExceptionHandlerTable = translateExceptionHandlerTable(
t,
context,
reinterpret_cast<intptr_t>(start),
reinterpret_cast<intptr_t>(start) + codeSize);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
PROTECT(t, newExceptionHandlerTable);
2014-07-11 15:47:57 +00:00
GcLineNumberTable* newLineNumberTable = translateLineNumberTable(
t, context, reinterpret_cast<intptr_t>(start));
2014-06-29 04:57:07 +00:00
GcCode* code = context->method->code();
2008-04-11 21:00:18 +00:00
2014-07-11 15:47:57 +00:00
code = makeCode(t,
0,
0,
newExceptionHandlerTable,
newLineNumberTable,
reinterpret_cast<uintptr_t>(start),
codeSize,
code->maxStack(),
code->maxLocals(),
0);
2014-06-25 20:38:13 +00:00
context->method->setCode(t, code);
2008-02-11 17:21:41 +00:00
}
if (context->traceLogCount) {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, TraceElement*, elements, context->traceLogCount);
unsigned index = 0;
// unsigned pathFootprint = 0;
// unsigned mapCount = 0;
for (TraceElement* p = context->traceLog; p; p = p->next) {
assertT(t, index < context->traceLogCount);
2008-04-11 21:00:18 +00:00
if (p->address) {
RUNTIME_ARRAY_BODY(elements)[index++] = p;
if (p->target) {
2014-07-11 15:50:18 +00:00
insertCallNode(
t, makeCallNode(t, p->address->value(), p->target, p->flags, 0));
}
2007-12-09 22:45:43 +00:00
}
}
2014-07-11 15:50:18 +00:00
qsort(RUNTIME_ARRAY_BODY(elements),
index,
sizeof(TraceElement*),
compareTraceElementPointers);
2014-06-29 04:57:07 +00:00
GcIntArray* map = makeSimpleFrameMapTable(
2014-06-01 16:04:56 +00:00
t, context, start, RUNTIME_ARRAY_BODY(elements), index);
2014-06-25 20:38:13 +00:00
context->method->code()->setStackMap(t, map);
}
2014-07-11 15:47:57 +00:00
logCompile(
t,
start,
codeSize,
reinterpret_cast<const char*>(
context->method->class_()->name()->body().begin()),
reinterpret_cast<const char*>(context->method->name()->body().begin()),
reinterpret_cast<const char*>(context->method->spec()->body().begin()));
2008-02-11 17:21:41 +00:00
// for debugging:
2014-07-11 15:47:57 +00:00
if (false
and ::strcmp(reinterpret_cast<const char*>(
context->method->class_()->name()->body().begin()),
"java/lang/System") == 0
and ::strcmp(reinterpret_cast<const char*>(
context->method->name()->body().begin()),
"<clinit>") == 0) {
trap();
2007-12-09 22:45:43 +00:00
}
syncInstructionCache(start, codeSize);
2007-12-09 22:45:43 +00:00
}
2007-09-30 02:48:27 +00:00
2014-07-11 15:50:18 +00:00
void compile(MyThread* t, Context* context)
2007-12-09 22:45:43 +00:00
{
avian::codegen::Compiler* c = context->compiler;
2007-09-30 02:48:27 +00:00
if (false) {
fprintf(stderr,
"compiling %s.%s%s\n",
context->method->class_()->name()->body().begin(),
context->method->name()->body().begin(),
context->method->spec()->body().begin());
}
2014-05-29 04:17:25 +00:00
unsigned footprint = context->method->parameterFootprint();
unsigned locals = localSize(t, context->method);
2014-07-11 15:47:57 +00:00
c->init(context->method->code()->length(),
footprint,
locals,
alignedFrameSize(t, context->method));
2007-09-30 02:48:27 +00:00
2014-07-11 15:47:57 +00:00
ir::Type* stackMap = (ir::Type*)malloc(sizeof(ir::Type)
* context->method->code()->maxStack());
2014-05-05 16:49:50 +00:00
Frame frame(context, stackMap);
2007-09-30 02:48:27 +00:00
2014-05-29 04:17:25 +00:00
unsigned index = context->method->parameterFootprint();
if ((context->method->flags() & ACC_STATIC) == 0) {
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::object());
c->initLocal(index, ir::Type::object());
2008-01-07 14:51:07 +00:00
}
2014-07-11 15:47:57 +00:00
for (MethodSpecIterator it(t,
reinterpret_cast<const char*>(
context->method->spec()->body().begin()));
it.hasNext();) {
2008-01-07 14:51:07 +00:00
switch (*it.next()) {
case 'L':
case '[':
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::object());
c->initLocal(index, ir::Type::object());
2008-01-07 14:51:07 +00:00
break;
2014-05-01 03:35:08 +00:00
2008-01-07 14:51:07 +00:00
case 'J':
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::i8());
frame.set(--index, ir::Type::i8());
c->initLocal(index, ir::Type::i8());
break;
2009-11-30 15:08:45 +00:00
2008-01-07 14:51:07 +00:00
case 'D':
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::f8());
frame.set(--index, ir::Type::f8());
c->initLocal(index, ir::Type::f8());
2008-01-07 14:51:07 +00:00
break;
2014-05-01 03:35:08 +00:00
case 'F':
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::i4());
c->initLocal(index, ir::Type::f4());
break;
2014-05-01 03:35:08 +00:00
2008-01-07 14:51:07 +00:00
default:
2014-06-01 20:22:14 +00:00
frame.set(--index, ir::Type::i4());
c->initLocal(index, ir::Type::i4());
2008-01-07 14:51:07 +00:00
break;
}
}
handleEntrance(t, &frame);
Compiler::State* state = c->saveState();
2007-12-09 22:45:43 +00:00
compile(t, &frame, 0);
2007-09-30 02:48:27 +00:00
context->dirtyRoots = false;
unsigned eventIndex = calculateFrameMaps(t, context, 0, 0, 0);
2008-01-07 14:51:07 +00:00
2014-07-11 15:47:57 +00:00
GcExceptionHandlerTable* eht = cast<GcExceptionHandlerTable>(
t, context->method->code()->exceptionHandlerTable());
2007-12-09 22:45:43 +00:00
if (eht) {
PROTECT(t, eht);
2007-09-30 02:48:27 +00:00
2014-06-29 04:57:07 +00:00
unsigned visitCount = eht->length();
2009-03-08 01:23:28 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, bool, visited, visitCount);
memset(RUNTIME_ARRAY_BODY(visited), 0, visitCount * sizeof(bool));
bool progress = true;
while (progress) {
progress = false;
for (unsigned subI = 0; subI <= context->subroutineCount; ++subI) {
2014-07-11 15:47:57 +00:00
unsigned duplicatedBaseIp = subI * context->method->code()->length();
2014-06-29 04:57:07 +00:00
for (unsigned i = 0; i < eht->length(); ++i) {
uint64_t eh = eht->body()[i];
int start
= resolveIpForwards(context,
duplicatedBaseIp + exceptionHandlerStart(eh),
duplicatedBaseIp + exceptionHandlerEnd(eh));
2014-07-11 15:50:18 +00:00
if ((not RUNTIME_ARRAY_BODY(visited)[i]) and start >= 0
and context->visitTable[start]) {
RUNTIME_ARRAY_BODY(visited)[i] = true;
progress = true;
2007-09-30 02:48:27 +00:00
c->restoreState(state);
2008-01-07 14:51:07 +00:00
2014-05-05 16:49:50 +00:00
ir::Type* stackMap = (ir::Type*)malloc(
2014-07-11 15:47:57 +00:00
sizeof(ir::Type) * context->method->code()->maxStack());
2014-05-05 16:49:50 +00:00
Frame frame2(&frame, stackMap);
unsigned end = duplicatedBaseIp + exceptionHandlerEnd(eh);
if (exceptionHandlerIp(eh) >= static_cast<unsigned>(start)
and exceptionHandlerIp(eh) < end) {
end = duplicatedBaseIp + exceptionHandlerIp(eh);
}
context->eventLog.append(PushExceptionHandlerEvent);
context->eventLog.append2(start);
context->eventLog.append2(end);
2014-07-11 15:47:57 +00:00
for (unsigned i = 1; i < context->method->code()->maxStack(); ++i) {
2014-06-01 20:22:14 +00:00
frame2.set(localSize(t, context->method) + i, ir::Type::i4());
}
compile(t, &frame2, exceptionHandlerIp(eh), start);
context->eventLog.append(PopContextEvent);
eventIndex = calculateFrameMaps(t, context, 0, eventIndex, 0);
}
}
}
2007-12-09 22:45:43 +00:00
}
}
2007-09-30 02:48:27 +00:00
while (context->dirtyRoots) {
context->dirtyRoots = false;
calculateFrameMaps(t, context, 0, 0, 0);
}
2014-05-05 16:49:50 +00:00
free(stackMap);
2007-12-09 22:45:43 +00:00
}
#endif // not AVIAN_AOT_ONLY
2007-09-30 02:48:27 +00:00
2014-07-11 15:50:18 +00:00
void updateCall(MyThread* t,
avian::codegen::lir::UnaryOperation op,
void* returnAddress,
void* target)
{
t->arch->updateCall(op, returnAddress, target);
2007-12-09 22:45:43 +00:00
}
2007-09-30 02:48:27 +00:00
2014-07-11 15:50:18 +00:00
void* compileMethod2(MyThread* t, void* ip);
2007-09-30 02:48:27 +00:00
2014-07-11 15:50:18 +00:00
uint64_t compileMethod(MyThread* t)
2007-12-16 22:41:07 +00:00
{
void* ip;
if (t->tailAddress) {
ip = t->tailAddress;
t->tailAddress = 0;
} else {
ip = getIp(t);
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return reinterpret_cast<uintptr_t>(compileMethod2(t, ip));
}
2014-07-11 15:47:57 +00:00
void* compileVirtualMethod2(MyThread* t, GcClass* class_, unsigned index)
{
// If class_ has BootstrapFlag set, that means its vtable is not yet
// available. However, we must set t->trace->targetMethod to an
// appropriate method to ensure we can accurately scan the stack for
// GC roots. We find such a method by looking for a superclass with
// a vtable and using it instead:
2014-06-29 04:57:07 +00:00
GcClass* c = class_;
while (c->vmFlags() & BootstrapFlag) {
c = c->super();
}
2014-07-11 15:47:57 +00:00
t->trace->targetMethod
= cast<GcMethod>(t, cast<GcArray>(t, c->virtualTable())->body()[index]);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RESOURCE0(t, static_cast<MyThread*>(t)->trace->targetMethod = 0;);
PROTECT(t, class_);
2014-05-29 04:17:25 +00:00
GcMethod* target = resolveTarget(t, class_, index);
PROTECT(t, target);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
compile(t, codeAllocator(t), 0, target);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
void* address = reinterpret_cast<void*>(methodAddress(t, target));
2014-05-29 04:17:25 +00:00
if (target->flags() & ACC_NATIVE) {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
t->trace->nativeMethod = target;
} else {
2014-06-29 04:57:07 +00:00
class_->vtable()[target->offset()] = address;
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return address;
}
2014-07-11 15:50:18 +00:00
uint64_t compileVirtualMethod(MyThread* t)
{
2014-05-29 04:17:25 +00:00
GcClass* class_ = objectClass(t, static_cast<object>(t->virtualCallTarget));
2009-05-03 20:57:11 +00:00
t->virtualCallTarget = 0;
unsigned index = t->virtualCallIndex;
t->virtualCallIndex = 0;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return reinterpret_cast<uintptr_t>(compileVirtualMethod2(t, class_, index));
}
2014-07-11 15:47:57 +00:00
uint64_t invokeNativeFast(MyThread* t, GcMethod* method, void* function)
2009-05-03 20:57:11 +00:00
{
2014-07-11 15:50:18 +00:00
FastNativeFunction f;
memcpy(&f, &function, sizeof(void*));
return f(t,
method,
static_cast<uintptr_t*>(t->stack) + t->arch->frameFooterSize()
2010-11-12 23:53:16 +00:00
+ t->arch->frameReturnAddressSize());
2009-05-03 20:57:11 +00:00
}
2014-07-11 15:47:57 +00:00
uint64_t invokeNativeSlow(MyThread* t, GcMethod* method, void* function)
2007-12-09 22:45:43 +00:00
{
PROTECT(t, method);
2014-05-29 04:17:25 +00:00
unsigned footprint = method->parameterFootprint() + 1;
if (method->flags() & ACC_STATIC) {
2014-07-11 15:50:18 +00:00
++footprint;
2007-12-09 22:45:43 +00:00
}
2014-05-29 04:17:25 +00:00
unsigned count = method->parameterCount() + 2;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, args, footprint);
2007-12-09 22:45:43 +00:00
unsigned argOffset = 0;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uint8_t, types, count);
2007-12-09 22:45:43 +00:00
unsigned typeOffset = 0;
2007-09-30 02:48:27 +00:00
RUNTIME_ARRAY_BODY(args)[argOffset++] = reinterpret_cast<uintptr_t>(t);
RUNTIME_ARRAY_BODY(types)[typeOffset++] = POINTER_TYPE;
2014-07-11 15:50:18 +00:00
uintptr_t* sp = static_cast<uintptr_t*>(t->stack) + t->arch->frameFooterSize()
+ t->arch->frameReturnAddressSize();
GcJclass* jclass = 0;
PROTECT(t, jclass);
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_STATIC) {
jclass = getJClass(t, method->class_());
RUNTIME_ARRAY_BODY(args)[argOffset++]
2014-07-11 15:50:18 +00:00
= reinterpret_cast<uintptr_t>(&jclass);
2007-12-09 22:45:43 +00:00
} else {
2014-07-11 15:50:18 +00:00
RUNTIME_ARRAY_BODY(args)[argOffset++] = reinterpret_cast<uintptr_t>(sp++);
2007-12-09 22:45:43 +00:00
}
RUNTIME_ARRAY_BODY(types)[typeOffset++] = POINTER_TYPE;
2014-07-11 15:47:57 +00:00
MethodSpecIterator it(
t, reinterpret_cast<const char*>(method->spec()->body().begin()));
2014-05-29 04:17:25 +00:00
2007-12-09 22:45:43 +00:00
while (it.hasNext()) {
unsigned type = RUNTIME_ARRAY_BODY(types)[typeOffset++]
2014-07-11 15:50:18 +00:00
= fieldType(t, fieldCode(t, *it.next()));
2007-12-09 22:45:43 +00:00
switch (type) {
case INT8_TYPE:
case INT16_TYPE:
case INT32_TYPE:
case FLOAT_TYPE:
RUNTIME_ARRAY_BODY(args)[argOffset++] = *(sp++);
2007-12-09 22:45:43 +00:00
break;
2007-12-09 22:45:43 +00:00
case INT64_TYPE:
case DOUBLE_TYPE: {
memcpy(RUNTIME_ARRAY_BODY(args) + argOffset, sp, 8);
2007-12-18 02:09:32 +00:00
argOffset += (8 / BytesPerWord);
2009-05-03 20:57:11 +00:00
sp += 2;
2007-12-09 22:45:43 +00:00
} break;
2007-12-09 22:45:43 +00:00
case POINTER_TYPE: {
if (*sp) {
2014-07-11 15:50:18 +00:00
RUNTIME_ARRAY_BODY(args)[argOffset++] = reinterpret_cast<uintptr_t>(sp);
} else {
RUNTIME_ARRAY_BODY(args)[argOffset++] = 0;
}
2014-07-11 15:50:18 +00:00
++sp;
2007-12-09 22:45:43 +00:00
} break;
2014-07-11 15:50:18 +00:00
default:
abort(t);
2007-10-03 00:22:48 +00:00
}
}
2014-05-29 04:17:25 +00:00
unsigned returnCode = method->returnCode();
unsigned returnType = fieldType(t, returnCode);
2007-12-09 22:45:43 +00:00
uint64_t result;
if (DebugNatives) {
2014-07-11 15:47:57 +00:00
fprintf(stderr,
"invoke native method %s.%s\n",
method->class_()->name()->body().begin(),
method->name()->body().begin());
2007-12-09 22:45:43 +00:00
}
2007-10-04 00:41:54 +00:00
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_SYNCHRONIZED) {
if (method->flags() & ACC_STATIC) {
acquire(t, method->class_());
} else {
acquire(t, *reinterpret_cast<object*>(RUNTIME_ARRAY_BODY(args)[1]));
}
}
Reference* reference = t->reference;
2014-07-11 15:50:18 +00:00
{
ENTER(t, Thread::IdleState);
2007-10-03 00:22:48 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
bool noThrow = t->checkpoint->noThrow;
t->checkpoint->noThrow = true;
THREAD_RESOURCE(t, bool, noThrow, t->checkpoint->noThrow = noThrow);
result = vm::dynamicCall(function,
RUNTIME_ARRAY_BODY(args),
RUNTIME_ARRAY_BODY(types),
count,
footprint * BytesPerWord,
returnType);
}
2007-09-25 23:53:11 +00:00
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_SYNCHRONIZED) {
if (method->flags() & ACC_STATIC) {
release(t, method->class_());
} else {
release(t, *reinterpret_cast<object*>(RUNTIME_ARRAY_BODY(args)[1]));
}
}
if (DebugNatives) {
2014-07-11 15:47:57 +00:00
fprintf(stderr,
"return from native method %s.%s\n",
method->class_()->name()->body().begin(),
method->name()->body().begin());
2007-10-03 00:22:48 +00:00
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
if (UNLIKELY(t->exception)) {
2014-06-28 23:24:24 +00:00
GcThrowable* exception = t->exception;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
t->exception = 0;
vm::throw_(t, exception);
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
switch (returnCode) {
case ByteField:
case BooleanField:
result = static_cast<int8_t>(result);
break;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case CharField:
result = static_cast<uint16_t>(result);
break;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case ShortField:
result = static_cast<int16_t>(result);
break;
2007-12-18 02:09:32 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case FloatField:
case IntField:
result = static_cast<int32_t>(result);
break;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case LongField:
case DoubleField:
break;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case ObjectField:
2014-07-11 15:50:18 +00:00
result = static_cast<uintptr_t>(result)
? *reinterpret_cast<uintptr_t*>(static_cast<uintptr_t>(result))
: 0;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
break;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
case VoidField:
result = 0;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
break;
2014-07-11 15:50:18 +00:00
default:
abort(t);
2007-10-03 00:22:48 +00:00
}
while (t->reference != reference) {
dispose(t, t->reference);
}
return result;
2007-12-09 22:45:43 +00:00
}
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
uint64_t invokeNative2(MyThread* t, GcMethod* method)
2009-05-03 20:57:11 +00:00
{
2014-06-29 04:57:07 +00:00
GcNative* native = getMethodRuntimeData(t, method)->native();
if (native->fast()) {
return invokeNativeFast(t, method, native->function());
2009-05-03 20:57:11 +00:00
} else {
2014-06-29 04:57:07 +00:00
return invokeNativeSlow(t, method, native->function());
2009-05-03 20:57:11 +00:00
}
}
2007-12-09 22:45:43 +00:00
2014-07-11 15:50:18 +00:00
uint64_t invokeNative(MyThread* t)
2007-12-09 22:45:43 +00:00
{
if (t->trace->nativeMethod == 0) {
void* ip;
if (t->tailAddress) {
ip = t->tailAddress;
t->tailAddress = 0;
} else {
ip = getIp(t);
}
GcCallNode* node = findCallNode(t, ip);
GcMethod* target = node->target();
if (node->flags() & TraceElement::VirtualCall) {
2008-04-23 16:33:31 +00:00
target = resolveTarget(t, t->stack, target);
2008-04-01 17:37:59 +00:00
}
2008-04-23 16:33:31 +00:00
t->trace->nativeMethod = target;
}
2008-04-01 17:37:59 +00:00
assertT(t, t->tailAddress == 0);
uint64_t result = 0;
2007-10-03 00:22:48 +00:00
t->trace->targetMethod = t->trace->nativeMethod;
t->m->classpath->resolveNative(t, t->trace->nativeMethod);
2009-05-03 20:57:11 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
result = invokeNative2(t, t->trace->nativeMethod);
2007-10-03 00:22:48 +00:00
2014-05-29 04:17:25 +00:00
unsigned parameterFootprint = t->trace->targetMethod->parameterFootprint();
2009-05-17 00:39:08 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
uintptr_t* stack = static_cast<uintptr_t*>(t->stack);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
if (avian::codegen::TailCalls
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
and t->arch->argumentFootprint(parameterFootprint)
2014-07-11 15:50:18 +00:00
> t->arch->stackAlignmentInWords()) {
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
stack += t->arch->argumentFootprint(parameterFootprint)
2014-07-11 15:50:18 +00:00
- t->arch->stackAlignmentInWords();
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
}
2009-05-17 00:39:08 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
stack += t->arch->frameReturnAddressSize();
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
t->trace->targetMethod = 0;
t->trace->nativeMethod = 0;
t->newStack = stack;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return result;
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:47:57 +00:00
void findFrameMapInSimpleTable(MyThread* t,
GcMethod* method,
GcIntArray* table,
int32_t offset,
int32_t** map,
unsigned* start)
{
unsigned tableSize = simpleFrameMapTableSize(t, method, table);
2014-06-29 04:57:07 +00:00
unsigned indexSize = table->length() - tableSize;
2014-06-29 04:57:07 +00:00
*map = &table->body()[indexSize];
2014-05-29 04:17:25 +00:00
unsigned bottom = 0;
unsigned top = indexSize;
for (unsigned span = top - bottom; span; span = top - bottom) {
unsigned middle = bottom + (span / 2);
2014-06-29 04:57:07 +00:00
int32_t v = table->body()[middle];
2014-05-29 04:17:25 +00:00
if (offset == v) {
*start = frameMapSizeInBits(t, method) * middle;
return;
} else if (offset < v) {
top = middle;
} else {
bottom = middle + 1;
}
}
abort(t);
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:47:57 +00:00
void findFrameMap(MyThread* t,
void* stack UNUSED,
GcMethod* method,
int32_t offset,
int32_t** map,
unsigned* start)
{
2014-07-11 15:47:57 +00:00
findFrameMapInSimpleTable(
t, method, method->code()->stackMap(), offset, map, start);
}
2014-07-11 15:47:57 +00:00
void visitStackAndLocals(MyThread* t,
Heap::Visitor* v,
void* frame,
GcMethod* method,
void* ip)
2007-12-09 22:45:43 +00:00
{
unsigned count = frameMapSizeInBits(t, method);
2007-12-09 22:45:43 +00:00
if (count) {
void* stack = stackForFrame(t, frame, method);
int32_t* map;
unsigned offset;
2014-07-11 15:50:18 +00:00
findFrameMap(
t,
stack,
method,
difference(ip, reinterpret_cast<void*>(methodAddress(t, method))),
&map,
&offset);
2007-12-09 22:45:43 +00:00
for (unsigned i = 0; i < count; ++i) {
int j = offset + i;
if (map[j / 32] & (static_cast<int32_t>(1) << (j % 32))) {
2014-05-29 04:17:25 +00:00
v->visit(localObject(t, stack, method, i));
}
2007-09-25 23:53:11 +00:00
}
}
}
2014-07-11 15:50:18 +00:00
void visitArgument(MyThread* t, Heap::Visitor* v, void* stack, unsigned index)
{
2014-07-11 15:50:18 +00:00
v->visit(static_cast<object*>(stack) + index
+ t->arch->frameReturnAddressSize() + t->arch->frameFooterSize());
}
2014-07-11 15:47:57 +00:00
void visitArguments(MyThread* t,
Heap::Visitor* v,
void* stack,
GcMethod* method)
{
unsigned index = 0;
2014-05-29 04:17:25 +00:00
if ((method->flags() & ACC_STATIC) == 0) {
2009-05-15 02:08:01 +00:00
visitArgument(t, v, stack, index++);
}
2014-07-11 15:47:57 +00:00
for (MethodSpecIterator it(
t, reinterpret_cast<const char*>(method->spec()->body().begin()));
it.hasNext();) {
switch (*it.next()) {
case 'L':
case '[':
2009-05-15 02:08:01 +00:00
visitArgument(t, v, stack, index++);
break;
2014-05-29 04:17:25 +00:00
case 'J':
case 'D':
index += 2;
break;
default:
2014-07-11 15:50:18 +00:00
++index;
break;
}
}
}
2014-07-11 15:50:18 +00:00
void visitStack(MyThread* t, Heap::Visitor* v)
{
void* ip = getIp(t);
2008-08-17 19:32:40 +00:00
void* stack = t->stack;
2007-12-30 22:24:48 +00:00
2007-12-09 22:45:43 +00:00
MyThread::CallTrace* trace = t->trace;
2014-05-29 04:17:25 +00:00
GcMethod* targetMethod = (trace ? trace->targetMethod : 0);
GcMethod* target = targetMethod;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
bool mostRecent = true;
2007-12-09 22:45:43 +00:00
2007-12-16 22:41:07 +00:00
while (stack) {
2009-05-17 23:43:48 +00:00
if (targetMethod) {
visitArguments(t, v, stack, targetMethod);
targetMethod = 0;
}
2014-05-29 04:17:25 +00:00
GcMethod* method = methodForIp(t, ip);
if (method) {
PROTECT(t, method);
void* nextIp = ip;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
nextFrame(t, &nextIp, &stack, method, target, mostRecent);
2008-01-07 14:51:07 +00:00
visitStackAndLocals(t, v, stack, method, ip);
2007-12-09 22:45:43 +00:00
ip = nextIp;
target = method;
2007-12-09 22:45:43 +00:00
} else if (trace) {
2008-08-17 19:32:40 +00:00
stack = trace->stack;
ip = trace->ip;
2007-12-09 22:45:43 +00:00
trace = trace->next;
if (trace) {
targetMethod = trace->targetMethod;
target = targetMethod;
} else {
target = 0;
}
2007-12-09 22:45:43 +00:00
} else {
break;
}
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
mostRecent = false;
}
2007-12-09 22:45:43 +00:00
}
2014-07-11 15:47:57 +00:00
void walkContinuationBody(MyThread* t,
Heap::Walker* w,
GcContinuation* c,
int start)
2009-05-03 20:57:11 +00:00
{
2009-05-17 23:43:48 +00:00
const int BodyOffset = ContinuationBody / BytesPerWord;
2009-05-03 20:57:11 +00:00
2014-06-27 00:17:16 +00:00
GcMethod* method = t->m->heap->follow(c->method());
2009-05-17 23:43:48 +00:00
int count = frameMapSizeInBits(t, method);
2009-05-03 20:57:11 +00:00
if (count) {
2014-07-11 15:47:57 +00:00
int stack = BodyOffset + (c->framePointerOffset() / BytesPerWord)
- t->arch->framePointerOffset()
- stackOffsetFromFrame(t, method);
2009-05-17 23:43:48 +00:00
int first = stack + localOffsetFromStack(t, count - 1, method);
if (start > first) {
count -= start - first;
}
int32_t* map;
unsigned offset;
2014-07-11 15:47:57 +00:00
findFrameMap(t,
reinterpret_cast<uintptr_t*>(c) + stack,
method,
difference(c->address(),
reinterpret_cast<void*>(methodAddress(t, method))),
&map,
&offset);
2009-05-03 20:57:11 +00:00
2009-05-17 23:43:48 +00:00
for (int i = count - 1; i >= 0; --i) {
int j = offset + i;
if (map[j / 32] & (static_cast<int32_t>(1) << (j % 32))) {
2009-05-17 23:43:48 +00:00
if (not w->visit(stack + localOffsetFromStack(t, i, method))) {
2009-05-03 20:57:11 +00:00
return;
2009-05-17 23:43:48 +00:00
}
2009-05-03 20:57:11 +00:00
}
}
}
}
2014-07-11 15:47:57 +00:00
void callContinuation(MyThread* t,
GcContinuation* continuation,
object result,
GcThrowable* exception,
void* ip,
void* stack)
2009-05-23 22:15:06 +00:00
{
assertT(t, t->exception == 0);
2009-05-23 22:15:06 +00:00
if (exception) {
t->exception = exception;
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
MyThread::TraceContext c(t, ip, stack, continuation, t->trace);
void* frame;
findUnwindTarget(t, &ip, &frame, &stack, &continuation);
2009-05-23 22:15:06 +00:00
}
2009-05-25 04:27:50 +00:00
t->trace->nativeMethod = 0;
t->trace->targetMethod = 0;
2011-01-27 18:54:41 +00:00
popResources(t);
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
transition(t, ip, stack, continuation, t->trace);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
vmJump(ip, 0, stack, t, reinterpret_cast<uintptr_t>(result), 0);
2009-05-23 22:15:06 +00:00
}
2014-07-11 15:47:57 +00:00
int8_t* returnSpec(MyThread* t, GcMethod* method)
2009-05-23 22:15:06 +00:00
{
int8_t* s = method->spec()->body().begin();
2014-07-11 15:50:18 +00:00
while (*s and *s != ')')
++s;
2009-05-23 22:15:06 +00:00
expect(t, *s == ')');
return s + 1;
}
2014-07-11 15:47:57 +00:00
GcClass* returnClass(MyThread* t, GcMethod* method)
{
PROTECT(t, method);
int8_t* spec = returnSpec(t, method);
unsigned length = strlen(reinterpret_cast<char*>(spec));
2014-06-28 23:24:24 +00:00
GcByteArray* name;
if (*spec == '[') {
2014-06-28 23:24:24 +00:00
name = makeByteArray(t, length + 1);
memcpy(name->body().begin(), spec, length);
} else {
assertT(t, *spec == 'L');
assertT(t, spec[length - 1] == ';');
2014-06-28 23:24:24 +00:00
name = makeByteArray(t, length - 1);
memcpy(name->body().begin(), spec + 1, length - 2);
}
2014-06-28 21:11:31 +00:00
return resolveClass(t, method->class_()->loader(), name);
}
2014-07-11 15:47:57 +00:00
bool compatibleReturnType(MyThread* t, GcMethod* oldMethod, GcMethod* newMethod)
2009-05-23 22:15:06 +00:00
{
if (oldMethod == newMethod) {
return true;
2014-07-11 15:47:57 +00:00
} else if (oldMethod->returnCode() == newMethod->returnCode()) {
2014-05-29 04:17:25 +00:00
if (oldMethod->returnCode() == ObjectField) {
PROTECT(t, newMethod);
2009-05-23 22:15:06 +00:00
2014-05-29 04:17:25 +00:00
GcClass* oldClass = returnClass(t, oldMethod);
PROTECT(t, oldClass);
2014-05-29 04:17:25 +00:00
GcClass* newClass = returnClass(t, newMethod);
return isAssignableFrom(t, oldClass, newClass);
2009-05-23 22:15:06 +00:00
} else {
return true;
}
} else {
2014-05-29 04:17:25 +00:00
return oldMethod->returnCode() == VoidField;
2009-05-23 22:15:06 +00:00
}
}
2014-07-11 15:47:57 +00:00
void jumpAndInvoke(MyThread* t, GcMethod* method, void* stack, ...)
2009-05-23 22:15:06 +00:00
{
t->trace->targetMethod = 0;
2009-05-23 22:15:06 +00:00
2014-05-29 04:17:25 +00:00
if (method->flags() & ACC_NATIVE) {
t->trace->nativeMethod = method;
} else {
t->trace->nativeMethod = 0;
}
2009-05-23 22:15:06 +00:00
2014-05-29 04:17:25 +00:00
unsigned argumentCount = method->parameterFootprint();
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, arguments, argumentCount);
2014-07-11 15:50:18 +00:00
va_list a;
va_start(a, stack);
for (unsigned i = 0; i < argumentCount; ++i) {
RUNTIME_ARRAY_BODY(arguments)[i] = va_arg(a, uintptr_t);
}
va_end(a);
2011-01-27 18:54:41 +00:00
assertT(t, t->exception == 0);
2011-01-27 18:54:41 +00:00
popResources(t);
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
vmJumpAndInvoke(
t,
reinterpret_cast<void*>(methodAddress(t, method)),
stack,
argumentCount * BytesPerWord,
RUNTIME_ARRAY_BODY(arguments),
(t->arch->alignFrameSize(t->arch->argumentFootprint(argumentCount))
+ t->arch->frameReturnAddressSize()) * BytesPerWord);
2009-05-23 22:15:06 +00:00
}
2014-07-11 15:47:57 +00:00
void callContinuation(MyThread* t,
GcContinuation* continuation,
object result,
GcThrowable* exception)
2009-05-23 22:15:06 +00:00
{
2014-07-11 15:50:18 +00:00
enum { Call, Unwind, Rewind } action;
2009-05-23 22:15:06 +00:00
2014-06-29 03:50:32 +00:00
GcContinuation* nextContinuation = 0;
2009-05-23 22:15:06 +00:00
if (t->continuation == 0
2014-07-11 15:47:57 +00:00
or t->continuation->context() != continuation->context()) {
2009-05-23 22:15:06 +00:00
PROTECT(t, continuation);
PROTECT(t, result);
PROTECT(t, exception);
2014-07-11 15:47:57 +00:00
if (compatibleReturnType(
t, t->trace->originalMethod, continuation->context()->method())) {
2014-06-29 03:50:32 +00:00
GcContinuationContext* oldContext;
GcContinuationContext* unwindContext;
2009-05-23 22:15:06 +00:00
if (t->continuation) {
2014-06-29 03:50:32 +00:00
oldContext = t->continuation->context();
unwindContext = oldContext;
} else {
oldContext = 0;
unwindContext = 0;
}
2014-06-29 03:50:32 +00:00
GcContinuationContext* rewindContext = 0;
2014-06-29 03:50:32 +00:00
for (GcContinuationContext* newContext = continuation->context();
2014-07-11 15:47:57 +00:00
newContext;
newContext = newContext->next()) {
if (newContext == oldContext) {
unwindContext = 0;
break;
} else {
rewindContext = newContext;
}
}
2014-07-11 15:47:57 +00:00
if (unwindContext and unwindContext->continuation()) {
nextContinuation
= cast<GcContinuation>(t, unwindContext->continuation());
result = makeUnwindResult(t, continuation, result, exception);
2009-05-23 22:15:06 +00:00
action = Unwind;
2014-07-11 15:47:57 +00:00
} else if (rewindContext and rewindContext->continuation()) {
nextContinuation
= cast<GcContinuation>(t, rewindContext->continuation());
action = Rewind;
if (compileRoots(t)->rewindMethod() == 0) {
PROTECT(t, nextContinuation);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
GcMethod* method = resolveMethod(
t,
roots(t)->bootLoader(),
"avian/Continuations",
"rewind",
"(Ljava/lang/Runnable;Lavian/Callback;Ljava/lang/Object;"
"Ljava/lang/Throwable;)V");
PROTECT(t, method);
2014-05-29 04:17:25 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
compile(t, local::codeAllocator(t), 0, method);
2014-05-29 04:17:25 +00:00
2014-06-25 20:38:13 +00:00
compileRoots(t)->setRewindMethod(t, method);
2009-05-23 22:15:06 +00:00
}
} else {
action = Call;
}
} else {
2014-05-29 04:17:25 +00:00
throwNew(t, GcIncompatibleContinuationException::Type);
2009-05-23 22:15:06 +00:00
}
} else {
action = Call;
}
void* ip;
void* frame;
2009-05-23 22:15:06 +00:00
void* stack;
2014-06-29 03:50:32 +00:00
GcContinuation* threadContinuation;
findUnwindTarget(t, &ip, &frame, &stack, &threadContinuation);
2009-05-23 22:15:06 +00:00
switch (action) {
case Call: {
2014-06-29 04:57:07 +00:00
callContinuation(t, continuation, result, exception, ip, stack);
2009-05-23 22:15:06 +00:00
} break;
case Unwind: {
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
callContinuation(t, nextContinuation, result, 0, ip, stack);
2009-05-23 22:15:06 +00:00
} break;
case Rewind: {
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
transition(t, 0, 0, nextContinuation, t->trace);
2014-07-11 15:47:57 +00:00
jumpAndInvoke(t,
compileRoots(t)->rewindMethod(),
stack,
nextContinuation->context()->before(),
continuation,
result,
exception);
2009-05-23 22:15:06 +00:00
} break;
default:
abort(t);
}
}
2014-07-11 15:50:18 +00:00
void callWithCurrentContinuation(MyThread* t, object receiver)
{
2014-05-29 04:17:25 +00:00
GcMethod* method = 0;
void* ip = 0;
void* stack = 0;
2014-07-11 15:50:18 +00:00
{
PROTECT(t, receiver);
if (compileRoots(t)->receiveMethod() == 0) {
2014-07-11 15:47:57 +00:00
GcMethod* m = resolveMethod(t,
roots(t)->bootLoader(),
"avian/Function",
"call",
"(Ljava/lang/Object;)Ljava/lang/Object;");
if (m) {
2014-06-25 20:38:13 +00:00
compileRoots(t)->setReceiveMethod(t, m);
2014-05-29 04:17:25 +00:00
2014-06-28 23:24:24 +00:00
GcClass* continuationClass = type(t, GcContinuation::Type);
2014-06-28 23:24:24 +00:00
if (continuationClass->vmFlags() & BootstrapFlag) {
2014-06-29 04:57:07 +00:00
resolveSystemClass(
2014-06-30 01:44:41 +00:00
t, roots(t)->bootLoader(), continuationClass->name());
}
}
}
2014-07-11 15:47:57 +00:00
method = findInterfaceMethod(
t, compileRoots(t)->receiveMethod(), objectClass(t, receiver));
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
PROTECT(t, method);
2014-05-29 04:17:25 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
compile(t, local::codeAllocator(t), 0, method);
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
t->continuation = makeCurrentContinuation(t, &ip, &stack);
}
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
jumpAndInvoke(t, method, stack, receiver, t->continuation);
}
2014-07-11 15:50:18 +00:00
void dynamicWind(MyThread* t, object before, object thunk, object after)
{
void* ip = 0;
void* stack = 0;
2014-07-11 15:50:18 +00:00
{
PROTECT(t, before);
PROTECT(t, thunk);
PROTECT(t, after);
if (compileRoots(t)->windMethod() == 0) {
2014-07-11 15:47:57 +00:00
GcMethod* method = resolveMethod(
t,
roots(t)->bootLoader(),
"avian/Continuations",
"wind",
"(Ljava/lang/Runnable;Ljava/util/concurrent/Callable;"
"Ljava/lang/Runnable;)Lavian/Continuations$UnwindResult;");
if (method) {
2014-06-25 20:38:13 +00:00
compileRoots(t)->setWindMethod(t, method);
compile(t, local::codeAllocator(t), 0, method);
}
}
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
t->continuation = makeCurrentContinuation(t, &ip, &stack);
2014-07-11 15:47:57 +00:00
GcContinuationContext* newContext
= makeContinuationContext(t,
t->continuation->context(),
before,
after,
t->continuation,
t->trace->originalMethod);
2014-06-25 20:38:13 +00:00
t->continuation->setContext(t, newContext);
}
jumpAndInvoke(t, compileRoots(t)->windMethod(), stack, before, thunk, after);
}
2007-09-25 23:53:11 +00:00
class ArgumentList {
public:
2014-07-11 15:50:18 +00:00
ArgumentList(Thread* t,
uintptr_t* array,
unsigned size,
bool* objectMask,
object this_,
const char* spec,
bool indirectObjects,
va_list arguments)
: t(static_cast<MyThread*>(t)),
array(array),
objectMask(objectMask),
size(size),
position(0),
protector(this)
2007-09-25 23:53:11 +00:00
{
if (this_) {
addObject(this_);
}
for (MethodSpecIterator it(t, spec); it.hasNext();) {
switch (*it.next()) {
2007-09-25 23:53:11 +00:00
case 'L':
case '[':
if (indirectObjects) {
object* v = va_arg(arguments, object*);
addObject(v ? *v : 0);
} else {
addObject(va_arg(arguments, object));
}
break;
2014-05-29 04:17:25 +00:00
2007-09-25 23:53:11 +00:00
case 'J':
addLong(va_arg(arguments, uint64_t));
break;
case 'D':
addLong(doubleToBits(va_arg(arguments, double)));
break;
case 'F':
addInt(floatToBits(va_arg(arguments, double)));
break;
2007-09-25 23:53:11 +00:00
default:
addInt(va_arg(arguments, uint32_t));
2014-05-29 04:17:25 +00:00
break;
2007-09-25 23:53:11 +00:00
}
}
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
ArgumentList(Thread* t,
uintptr_t* array,
unsigned size,
bool* objectMask,
object this_,
const char* spec,
const jvalue* arguments)
: t(static_cast<MyThread*>(t)),
array(array),
objectMask(objectMask),
size(size),
position(0),
protector(this)
{
if (this_) {
addObject(this_);
}
unsigned index = 0;
for (MethodSpecIterator it(t, spec); it.hasNext();) {
switch (*it.next()) {
case 'L':
case '[': {
object* v = arguments[index++].l;
addObject(v ? *v : 0);
} break;
2014-05-29 04:17:25 +00:00
case 'J':
addLong(arguments[index++].j);
break;
case 'D':
addLong(doubleToBits(arguments[index++].d));
break;
case 'F':
addInt(floatToBits(arguments[index++].f));
break;
default:
addInt(arguments[index++].i);
2014-05-29 04:17:25 +00:00
break;
}
}
}
2014-07-11 15:50:18 +00:00
ArgumentList(Thread* t,
uintptr_t* array,
unsigned size,
bool* objectMask,
object this_,
const char* spec,
object arguments)
: t(static_cast<MyThread*>(t)),
array(array),
objectMask(objectMask),
size(size),
position(0),
protector(this)
2007-09-25 23:53:11 +00:00
{
if (this_) {
addObject(this_);
}
unsigned index = 0;
for (MethodSpecIterator it(t, spec); it.hasNext();) {
switch (*it.next()) {
2007-09-25 23:53:11 +00:00
case 'L':
case '[':
addObject(objectArrayBody(t, arguments, index++));
break;
2014-05-29 04:17:25 +00:00
2007-09-25 23:53:11 +00:00
case 'J':
case 'D':
2014-07-11 15:50:18 +00:00
addLong(
fieldAtOffset<int64_t>(objectArrayBody(t, arguments, index++), 8));
2007-09-25 23:53:11 +00:00
break;
default:
2013-02-11 00:38:51 +00:00
addInt(fieldAtOffset<int32_t>(objectArrayBody(t, arguments, index++),
2014-07-11 15:50:18 +00:00
BytesPerWord));
break;
2007-09-25 23:53:11 +00:00
}
}
}
2014-07-11 15:50:18 +00:00
void addObject(object v)
{
assertT(t, position < size);
2007-09-25 23:53:11 +00:00
array[position] = reinterpret_cast<uintptr_t>(v);
objectMask[position] = true;
2014-07-11 15:50:18 +00:00
++position;
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
void addInt(uintptr_t v)
{
assertT(t, position < size);
2007-09-25 23:53:11 +00:00
array[position] = v;
objectMask[position] = false;
2014-07-11 15:50:18 +00:00
++position;
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
void addLong(uint64_t v)
{
assertT(t, position < size - 1);
2009-05-03 20:57:11 +00:00
memcpy(array + position, &v, 8);
2007-09-25 23:53:11 +00:00
objectMask[position] = false;
2007-12-23 20:06:24 +00:00
objectMask[position + 1] = false;
2009-05-03 20:57:11 +00:00
position += 2;
2007-09-25 23:53:11 +00:00
}
MyThread* t;
uintptr_t* array;
bool* objectMask;
unsigned size;
2007-09-25 23:53:11 +00:00
unsigned position;
2014-07-11 15:50:18 +00:00
class MyProtector : public Thread::Protector {
public:
2014-07-11 15:50:18 +00:00
MyProtector(ArgumentList* list) : Protector(list->t), list(list)
{
}
2014-07-11 15:50:18 +00:00
virtual void visit(Heap::Visitor* v)
{
2009-05-17 23:43:48 +00:00
for (unsigned i = 0; i < list->position; ++i) {
if (list->objectMask[i]) {
v->visit(reinterpret_cast<object*>(list->array + i));
}
}
}
ArgumentList* list;
} protector;
2007-09-25 23:53:11 +00:00
};
2014-07-11 15:47:57 +00:00
object invoke(Thread* thread, GcMethod* method, ArgumentList* arguments)
2007-09-25 23:53:11 +00:00
{
MyThread* t = static_cast<MyThread*>(thread);
if (false) {
PROTECT(t, method);
2014-07-11 15:47:57 +00:00
compile(
t,
local::codeAllocator(static_cast<MyThread*>(t)),
0,
resolveMethod(
t, roots(t)->appLoader(), "foo/ClassName", "methodName", "()V"));
}
uintptr_t stackLimit = t->stackLimit;
uintptr_t stackPosition = reinterpret_cast<uintptr_t>(&t);
if (stackLimit == 0) {
2012-03-14 18:36:42 +00:00
t->stackLimit = stackPosition - t->m->stackSizeInBytes;
} else if (stackPosition < stackLimit) {
2014-05-29 04:17:25 +00:00
throwNew(t, GcStackOverflowError::Type);
}
2014-07-11 15:50:18 +00:00
THREAD_RESOURCE(t,
uintptr_t,
stackLimit,
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
static_cast<MyThread*>(t)->stackLimit = stackLimit);
2014-05-29 04:17:25 +00:00
unsigned returnCode = method->returnCode();
2007-09-25 23:53:11 +00:00
unsigned returnType = fieldType(t, returnCode);
2007-12-30 22:24:48 +00:00
uint64_t result;
2007-09-30 02:48:27 +00:00
2014-07-11 15:50:18 +00:00
{
MyThread::CallTrace trace(t, method);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
MyCheckpoint checkpoint(t);
assertT(t, arguments->position == arguments->size);
2014-07-11 15:50:18 +00:00
result = vmInvoke(
t,
reinterpret_cast<void*>(methodAddress(t, method)),
arguments->array,
arguments->position * BytesPerWord,
t->arch->alignFrameSize(t->arch->argumentFootprint(arguments->position))
* BytesPerWord,
returnType);
2007-12-30 22:24:48 +00:00
}
2007-09-25 23:53:11 +00:00
2014-05-29 04:17:25 +00:00
if (t->exception) {
if (UNLIKELY(t->getFlags() & Thread::UseBackupHeapFlag)) {
collect(t, Heap::MinorCollection);
}
2014-05-29 04:17:25 +00:00
2014-06-28 23:24:24 +00:00
GcThrowable* exception = t->exception;
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
t->exception = 0;
vm::throw_(t, exception);
}
2007-09-25 23:53:11 +00:00
object r;
switch (returnCode) {
case ByteField:
case BooleanField:
case CharField:
case ShortField:
case FloatField:
case IntField:
r = makeInt(t, result);
2007-09-25 23:53:11 +00:00
break;
case LongField:
case DoubleField:
r = makeLong(t, result);
2007-09-25 23:53:11 +00:00
break;
case ObjectField:
2007-12-16 00:24:15 +00:00
r = reinterpret_cast<object>(result);
2007-09-25 23:53:11 +00:00
break;
case VoidField:
r = 0;
break;
default:
abort(t);
}
return r;
}
2014-07-11 15:50:18 +00:00
class SignalHandler : public SignalRegistrar::Handler {
2007-12-30 22:24:48 +00:00
public:
2014-06-26 02:17:27 +00:00
typedef GcThrowable* (GcRoots::*ExceptionGetter)();
2014-07-11 15:47:57 +00:00
SignalHandler(Gc::Type type, ExceptionGetter exc, unsigned fixedSize)
: m(0), type(type), exc(exc), fixedSize(fixedSize)
{
}
2007-12-30 22:24:48 +00:00
void setException(MyThread* t) {
if (ensure(t, pad(fixedSize) + traceSize(t))) {
t->setFlag(Thread::TracingFlag);
t->exception = makeThrowable(t, type);
t->clearFlag(Thread::TracingFlag);
} else {
// not enough memory available for a new exception and stack
// trace -- use a preallocated instance instead
t->exception = (vm::roots(t)->*exc)();
}
}
2014-07-11 15:50:18 +00:00
virtual bool handleSignal(void** ip,
void** frame,
void** stack,
void** thread)
{
2007-12-30 22:24:48 +00:00
MyThread* t = static_cast<MyThread*>(m->localThread->get());
if (t and t->state == Thread::ActiveState) {
if (t->getFlags() & Thread::TryNativeFlag) {
setException(t);
popResources(t);
GcContinuation* continuation;
findUnwindTarget(t, ip, frame, stack, &continuation);
t->trace->targetMethod = 0;
t->trace->nativeMethod = 0;
transition(t, *ip, *stack, continuation, t->trace);
*thread = t;
return true;
} else if (methodForIp(t, *ip)) {
2009-09-04 23:08:45 +00:00
// add one to the IP since findLineNumber will subtract one
// when we make the trace:
2014-07-11 15:50:18 +00:00
MyThread::TraceContext context(
t,
static_cast<uint8_t*>(*ip) + 1,
static_cast<void**>(*stack) - t->arch->frameReturnAddressSize(),
t->continuation,
t->trace);
2008-04-09 19:08:13 +00:00
setException(t);
2008-01-02 01:07:12 +00:00
// printTrace(t, t->exception);
2014-06-29 03:50:32 +00:00
GcContinuation* continuation;
findUnwindTarget(t, ip, frame, stack, &continuation);
2008-04-23 16:33:31 +00:00
transition(t, *ip, *stack, continuation, t->trace);
2008-04-23 16:33:31 +00:00
2008-01-02 01:07:12 +00:00
*thread = t;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2008-01-02 01:07:12 +00:00
return true;
}
2007-12-30 22:24:48 +00:00
}
if (compileLog) {
fflush(compileLog);
}
2008-01-02 01:07:12 +00:00
return false;
2007-12-30 22:24:48 +00:00
}
Machine* m;
2014-05-29 04:17:25 +00:00
Gc::Type type;
2014-06-30 01:44:41 +00:00
ExceptionGetter exc;
unsigned fixedSize;
2007-12-30 22:24:48 +00:00
};
2014-07-11 15:50:18 +00:00
bool isThunk(MyThread* t, void* ip);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
bool isVirtualThunk(MyThread* t, void* ip);
2014-07-11 15:50:18 +00:00
bool isThunkUnsafeStack(MyThread* t, void* ip);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
void boot(MyThread* t, BootImage* image, uint8_t* code);
2008-11-23 23:58:01 +00:00
class MyProcessor;
2014-07-11 15:50:18 +00:00
MyProcessor* processor(MyThread* t);
#ifndef AVIAN_AOT_ONLY
2014-07-11 15:50:18 +00:00
void compileThunks(MyThread* t, FixedAllocator* allocator);
#endif
2012-05-02 15:49:31 +00:00
class CompilationHandlerList {
2014-07-11 15:50:18 +00:00
public:
CompilationHandlerList(CompilationHandlerList* next,
Processor::CompilationHandler* handler)
: next(next), handler(handler)
{
}
2012-05-02 15:49:31 +00:00
2014-07-11 15:50:18 +00:00
void dispose(Allocator* allocator)
{
if (this) {
2012-05-02 15:49:31 +00:00
next->dispose(allocator);
handler->dispose();
allocator->free(this, sizeof(*this));
}
}
CompilationHandlerList* next;
Processor::CompilationHandler* handler;
};
2014-07-11 15:50:18 +00:00
template <class T, class C>
int checkConstant(MyThread* t, size_t expected, T C::*field, const char* name)
{
size_t actual = reinterpret_cast<uint8_t*>(&(t->*field))
- reinterpret_cast<uint8_t*>(t);
if (expected != actual) {
2013-12-19 05:25:23 +00:00
fprintf(stderr,
"constant mismatch (%s): \n\tconstant says: %d\n\tc++ compiler "
"says: %d\n",
name,
(unsigned)expected,
(unsigned)actual);
return 1;
}
return 0;
}
2014-07-11 15:50:18 +00:00
class MyProcessor : public Processor {
public:
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
class Thunk {
public:
2014-07-11 15:50:18 +00:00
Thunk() : start(0), frameSavedOffset(0), length(0)
{
}
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
2014-07-11 15:50:18 +00:00
Thunk(uint8_t* start, unsigned frameSavedOffset, unsigned length)
: start(start), frameSavedOffset(frameSavedOffset), length(length)
{
}
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
uint8_t* start;
unsigned frameSavedOffset;
unsigned length;
};
class ThunkCollection {
public:
Thunk default_;
Thunk defaultVirtual;
Thunk native;
Thunk aioob;
Thunk stackOverflow;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
Thunk table;
};
2014-02-22 00:06:17 +00:00
MyProcessor(System* s,
Allocator* allocator,
const char* crashDumpDirectory,
bool useNativeFeatures)
: s(s),
allocator(allocator),
roots(0),
bootImage(0),
heapImage(0),
codeImage(0),
codeImageSize(0),
2014-05-29 04:17:25 +00:00
segFaultHandler(GcNullPointerException::Type,
2014-06-30 01:44:41 +00:00
&GcRoots::nullPointerException,
2014-05-29 04:17:25 +00:00
GcNullPointerException::FixedSize),
divideByZeroHandler(GcArithmeticException::Type,
2014-06-30 01:44:41 +00:00
&GcRoots::arithmeticException,
2014-05-29 04:17:25 +00:00
GcArithmeticException::FixedSize),
2014-02-25 22:46:35 +00:00
codeAllocator(s, Slice<uint8_t>(0, 0)),
2014-02-22 00:06:17 +00:00
callTableSize(0),
useNativeFeatures(useNativeFeatures),
compilationHandlers(0)
{
thunkTable[compileMethodIndex] = voidPointer(local::compileMethod);
thunkTable[compileVirtualMethodIndex] = voidPointer(compileVirtualMethod);
thunkTable[invokeNativeIndex] = voidPointer(invokeNative);
2014-07-11 15:50:18 +00:00
thunkTable[throwArrayIndexOutOfBoundsIndex]
= voidPointer(throwArrayIndexOutOfBounds);
thunkTable[throwStackOverflowIndex] = voidPointer(throwStackOverflow);
using namespace avian::codegen::runtime;
#define THUNK(s) thunkTable[s##Index] = voidPointer(s);
#include "thunks.cpp"
#undef THUNK
// Set the dummyIndex entry to a constant which should require the
// maximum number of bytes to represent in assembly code
// (i.e. can't be represented by a smaller number of bytes and
// implicitly sign- or zero-extended). We'll use this property
// later to determine the maximum size of a thunk in the thunk
// table.
2014-07-11 15:50:18 +00:00
thunkTable[dummyIndex] = reinterpret_cast<void*>(
static_cast<uintptr_t>(UINT64_C(0x5555555555555555)));
2014-02-22 00:06:17 +00:00
signals.setCrashDumpDirectory(crashDumpDirectory);
}
2014-07-11 15:47:57 +00:00
virtual Thread* makeThread(Machine* m, GcThread* javaThread, Thread* parent)
2007-09-25 23:53:11 +00:00
{
2014-07-11 15:50:18 +00:00
MyThread* t = new (m->heap->allocate(sizeof(MyThread))) MyThread(
m, javaThread, static_cast<MyThread*>(parent), useNativeFeatures);
t->heapImage = heapImage;
t->codeImage = codeImage;
t->thunkTable = thunkTable;
2009-05-05 01:04:17 +00:00
#if TARGET_BYTES_PER_WORD == BYTES_PER_WORD
2013-12-19 05:25:23 +00:00
int mismatches
= checkConstant(t,
TARGET_THREAD_EXCEPTION,
&Thread::exception,
"TARGET_THREAD_EXCEPTION")
+ checkConstant(t,
TARGET_THREAD_EXCEPTIONSTACKADJUSTMENT,
&MyThread::exceptionStackAdjustment,
"TARGET_THREAD_EXCEPTIONSTACKADJUSTMENT")
+ checkConstant(t,
TARGET_THREAD_EXCEPTIONOFFSET,
&MyThread::exceptionOffset,
"TARGET_THREAD_EXCEPTIONOFFSET")
+ checkConstant(t,
TARGET_THREAD_EXCEPTIONHANDLER,
&MyThread::exceptionHandler,
"TARGET_THREAD_EXCEPTIONHANDLER")
+ checkConstant(
t, TARGET_THREAD_IP, &MyThread::ip, "TARGET_THREAD_IP")
+ checkConstant(
t, TARGET_THREAD_STACK, &MyThread::stack, "TARGET_THREAD_STACK")
+ checkConstant(t,
TARGET_THREAD_NEWSTACK,
&MyThread::newStack,
"TARGET_THREAD_NEWSTACK")
+ checkConstant(t,
TARGET_THREAD_TAILADDRESS,
&MyThread::tailAddress,
"TARGET_THREAD_TAILADDRESS")
+ checkConstant(t,
TARGET_THREAD_VIRTUALCALLTARGET,
&MyThread::virtualCallTarget,
"TARGET_THREAD_VIRTUALCALLTARGET")
+ checkConstant(t,
TARGET_THREAD_VIRTUALCALLINDEX,
&MyThread::virtualCallIndex,
"TARGET_THREAD_VIRTUALCALLINDEX")
+ checkConstant(t,
TARGET_THREAD_HEAPIMAGE,
&MyThread::heapImage,
"TARGET_THREAD_HEAPIMAGE")
+ checkConstant(t,
TARGET_THREAD_CODEIMAGE,
&MyThread::codeImage,
2013-12-19 05:25:23 +00:00
"TARGET_THREAD_CODEIMAGE")
+ checkConstant(t,
TARGET_THREAD_THUNKTABLE,
&MyThread::thunkTable,
"TARGET_THREAD_THUNKTABLE")
+ checkConstant(t,
TARGET_THREAD_STACKLIMIT,
&MyThread::stackLimit,
"TARGET_THREAD_STACKLIMIT");
2014-07-11 15:50:18 +00:00
if (mismatches > 0) {
fprintf(stderr, "%d constant mismatches\n", mismatches);
abort(t);
2009-05-25 00:22:36 +00:00
}
2014-06-28 00:32:20 +00:00
expect(t, TargetClassArrayElementSize == ClassArrayElementSize);
expect(t, TargetClassFixedSize == ClassFixedSize);
expect(t, TargetClassVtable == ClassVtable);
#endif
t->init();
return t;
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:47:57 +00:00
virtual GcMethod* makeMethod(vm::Thread* t,
uint8_t vmFlags,
uint8_t returnCode,
uint8_t parameterCount,
uint8_t parameterFootprint,
uint16_t flags,
uint16_t offset,
GcByteArray* name,
GcByteArray* spec,
GcMethodAddendum* addendum,
GcClass* class_,
GcCode* code)
2007-10-04 03:19:39 +00:00
{
if (code) {
2014-05-29 04:17:25 +00:00
code->compiled() = local::defaultThunk(static_cast<MyThread*>(t));
}
2014-05-29 04:17:25 +00:00
return vm::makeMethod(t,
vmFlags,
returnCode,
parameterCount,
parameterFootprint,
flags,
offset,
0,
0,
name,
spec,
addendum,
class_,
2014-06-28 04:00:05 +00:00
code);
2007-10-04 03:19:39 +00:00
}
2014-07-11 15:47:57 +00:00
virtual GcClass* makeClass(vm::Thread* t,
uint16_t flags,
uint16_t vmFlags,
uint16_t fixedSize,
uint8_t arrayElementSize,
uint8_t arrayDimensions,
GcClass* arrayElementClass,
GcIntArray* objectMask,
GcByteArray* name,
GcByteArray* sourceFile,
GcClass* super,
object interfaceTable,
object virtualTable,
object fieldTable,
object methodTable,
GcClassAddendum* addendum,
GcSingleton* staticTable,
GcClassLoader* loader,
unsigned vtableLength)
{
2014-05-29 04:17:25 +00:00
return vm::makeClass(t,
flags,
vmFlags,
fixedSize,
arrayElementSize,
arrayDimensions,
2014-06-28 00:32:20 +00:00
arrayElementClass,
2014-05-29 04:17:25 +00:00
0,
objectMask,
name,
sourceFile,
super,
2014-05-29 04:17:25 +00:00
interfaceTable,
virtualTable,
fieldTable,
methodTable,
addendum,
2014-06-28 00:32:20 +00:00
staticTable,
loader,
2014-05-29 04:17:25 +00:00
0,
vtableLength);
2007-12-11 21:26:59 +00:00
}
2014-07-11 15:47:57 +00:00
virtual void initVtable(Thread* t, GcClass* c)
2007-12-11 21:26:59 +00:00
{
PROTECT(t, c);
2014-05-29 04:17:25 +00:00
for (int i = c->length() - 1; i >= 0; --i) {
2014-07-11 15:50:18 +00:00
void* thunk
= reinterpret_cast<void*>(virtualThunk(static_cast<MyThread*>(t), i));
2014-06-29 04:57:07 +00:00
c->vtable()[i] = thunk;
}
}
2014-07-11 15:50:18 +00:00
virtual void visitObjects(Thread* vmt, Heap::Visitor* v)
2007-09-25 23:53:11 +00:00
{
MyThread* t = static_cast<MyThread*>(vmt);
2007-12-09 22:45:43 +00:00
if (t == t->m->rootThread) {
v->visit(&roots);
}
2007-09-25 23:53:11 +00:00
for (MyThread::CallTrace* trace = t->trace; trace; trace = trace->next) {
2009-05-03 20:57:11 +00:00
v->visit(&(trace->continuation));
v->visit(&(trace->nativeMethod));
v->visit(&(trace->targetMethod));
v->visit(&(trace->originalMethod));
}
2008-04-01 17:37:59 +00:00
2009-05-03 20:57:11 +00:00
v->visit(&(t->continuation));
2007-12-09 22:45:43 +00:00
for (Reference* r = t->reference; r; r = r->next) {
v->visit(&(r->target));
}
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
visitStack(t, v);
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void walkStack(Thread* vmt, StackVisitor* v)
2007-09-25 23:53:11 +00:00
{
2007-12-09 22:45:43 +00:00
MyThread* t = static_cast<MyThread*>(vmt);
2007-09-25 23:53:11 +00:00
2007-12-09 22:45:43 +00:00
MyStackWalker walker(t);
walker.walk(v);
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:47:57 +00:00
virtual int lineNumber(Thread* vmt, GcMethod* method, int ip)
2007-10-04 22:41:19 +00:00
{
2007-12-09 22:45:43 +00:00
return findLineNumber(static_cast<MyThread*>(vmt), method, ip);
2007-10-04 22:41:19 +00:00
}
2014-07-11 15:50:18 +00:00
virtual object* makeLocalReference(Thread* vmt, object o)
2007-09-25 23:53:11 +00:00
{
if (o) {
MyThread* t = static_cast<MyThread*>(vmt);
for (Reference* r = t->reference; r; r = r->next) {
if (r->target == o) {
acquire(t, r);
return &(r->target);
}
}
2008-04-13 18:15:04 +00:00
Reference* r = new (t->m->heap->allocate(sizeof(Reference)))
2014-07-11 15:50:18 +00:00
Reference(o, &(t->reference), false);
acquire(t, r);
return &(r->target);
} else {
return 0;
}
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void disposeLocalReference(Thread* t, object* r)
2007-09-25 23:53:11 +00:00
{
if (r) {
release(t, reinterpret_cast<Reference*>(r));
}
2007-09-25 23:53:11 +00:00
}
2014-07-11 15:50:18 +00:00
virtual bool pushLocalFrame(Thread* vmt, unsigned)
{
MyThread* t = static_cast<MyThread*>(vmt);
2014-07-11 15:50:18 +00:00
t->referenceFrame = new (t->m->heap->allocate(sizeof(List<Reference*>)))
List<Reference*>(t->reference, t->referenceFrame);
2014-05-29 04:17:25 +00:00
return true;
}
2014-07-11 15:50:18 +00:00
virtual void popLocalFrame(Thread* vmt)
{
MyThread* t = static_cast<MyThread*>(vmt);
List<Reference*>* f = t->referenceFrame;
t->referenceFrame = f->next;
while (t->reference != f->item) {
vm::dispose(t, t->reference);
}
t->m->heap->free(f, sizeof(List<Reference*>));
}
2014-07-11 15:47:57 +00:00
virtual object invokeArray(Thread* t,
GcMethod* method,
object this_,
object arguments)
{
assertT(t, t->exception == 0);
2008-04-01 17:37:59 +00:00
2014-07-11 15:47:57 +00:00
assertT(
t,
t->state == Thread::ActiveState or t->state == Thread::ExclusiveState);
assertT(t, ((method->flags() & ACC_STATIC) == 0) xor (this_ == 0));
method = findMethod(t, method, this_);
2014-07-11 15:47:57 +00:00
const char* spec = reinterpret_cast<char*>(method->spec()->body().begin());
2007-09-25 23:53:11 +00:00
2014-05-29 04:17:25 +00:00
unsigned size = method->parameterFootprint();
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, array, size);
THREAD_RUNTIME_ARRAY(t, bool, objectMask, size);
2014-07-11 15:50:18 +00:00
ArgumentList list(t,
RUNTIME_ARRAY_BODY(array),
size,
RUNTIME_ARRAY_BODY(objectMask),
this_,
spec,
arguments);
2014-05-29 04:17:25 +00:00
2007-12-09 22:45:43 +00:00
PROTECT(t, method);
compile(static_cast<MyThread*>(t),
2014-07-11 15:50:18 +00:00
local::codeAllocator(static_cast<MyThread*>(t)),
0,
method);
2007-12-09 22:45:43 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return local::invoke(t, method, &list);
}
2014-07-11 15:47:57 +00:00
virtual object invokeArray(Thread* t,
GcMethod* method,
object this_,
const jvalue* arguments)
{
assertT(t, t->exception == 0);
2014-07-11 15:47:57 +00:00
assertT(
t,
t->state == Thread::ActiveState or t->state == Thread::ExclusiveState);
assertT(t, ((method->flags() & ACC_STATIC) == 0) xor (this_ == 0));
2014-05-29 04:17:25 +00:00
method = findMethod(t, method, this_);
2014-07-11 15:47:57 +00:00
const char* spec = reinterpret_cast<char*>(method->spec()->body().begin());
2014-05-29 04:17:25 +00:00
unsigned size = method->parameterFootprint();
THREAD_RUNTIME_ARRAY(t, uintptr_t, array, size);
THREAD_RUNTIME_ARRAY(t, bool, objectMask, size);
2014-07-11 15:50:18 +00:00
ArgumentList list(t,
RUNTIME_ARRAY_BODY(array),
size,
RUNTIME_ARRAY_BODY(objectMask),
this_,
spec,
arguments);
PROTECT(t, method);
compile(static_cast<MyThread*>(t),
2014-07-11 15:50:18 +00:00
local::codeAllocator(static_cast<MyThread*>(t)),
0,
method);
return local::invoke(t, method, &list);
}
2014-07-11 15:47:57 +00:00
virtual object invokeList(Thread* t,
GcMethod* method,
object this_,
bool indirectObjects,
va_list arguments)
{
assertT(t, t->exception == 0);
2008-04-01 17:37:59 +00:00
2014-07-11 15:47:57 +00:00
assertT(
t,
t->state == Thread::ActiveState or t->state == Thread::ExclusiveState);
assertT(t, ((method->flags() & ACC_STATIC) == 0) xor (this_ == 0));
2014-05-29 04:17:25 +00:00
method = findMethod(t, method, this_);
2014-07-11 15:47:57 +00:00
const char* spec = reinterpret_cast<char*>(method->spec()->body().begin());
2007-09-25 23:53:11 +00:00
2014-05-29 04:17:25 +00:00
unsigned size = method->parameterFootprint();
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, array, size);
THREAD_RUNTIME_ARRAY(t, bool, objectMask, size);
2014-07-11 15:50:18 +00:00
ArgumentList list(t,
RUNTIME_ARRAY_BODY(array),
size,
RUNTIME_ARRAY_BODY(objectMask),
this_,
spec,
indirectObjects,
arguments);
2007-12-09 22:45:43 +00:00
PROTECT(t, method);
compile(static_cast<MyThread*>(t),
2014-07-11 15:50:18 +00:00
local::codeAllocator(static_cast<MyThread*>(t)),
0,
method);
2007-12-09 22:45:43 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return local::invoke(t, method, &list);
}
2014-07-11 15:47:57 +00:00
virtual object invokeList(Thread* t,
GcClassLoader* loader,
const char* className,
const char* methodName,
const char* methodSpec,
object this_,
va_list arguments)
{
assertT(t, t->exception == 0);
2008-04-01 17:37:59 +00:00
2014-07-11 15:47:57 +00:00
assertT(
t,
t->state == Thread::ActiveState or t->state == Thread::ExclusiveState);
unsigned size = parameterFootprint(t, methodSpec, this_ == 0);
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
THREAD_RUNTIME_ARRAY(t, uintptr_t, array, size);
THREAD_RUNTIME_ARRAY(t, bool, objectMask, size);
2014-07-11 15:50:18 +00:00
ArgumentList list(t,
RUNTIME_ARRAY_BODY(array),
size,
RUNTIME_ARRAY_BODY(objectMask),
this_,
methodSpec,
false,
arguments);
2014-07-11 15:47:57 +00:00
GcMethod* method
= resolveMethod(t, loader, className, methodName, methodSpec);
assertT(t, ((method->flags() & ACC_STATIC) == 0) xor (this_ == 0));
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
PROTECT(t, method);
2014-05-29 04:17:25 +00:00
compile(static_cast<MyThread*>(t),
2014-07-11 15:47:57 +00:00
local::codeAllocator(static_cast<MyThread*>(t)),
0,
method);
2007-10-03 00:22:48 +00:00
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
return local::invoke(t, method, &list);
2007-12-09 22:45:43 +00:00
}
2007-10-03 00:22:48 +00:00
2014-07-11 15:50:18 +00:00
virtual void dispose(Thread* vmt)
{
2007-12-30 22:24:48 +00:00
MyThread* t = static_cast<MyThread*>(vmt);
2007-12-11 21:26:59 +00:00
while (t->reference) {
vm::dispose(t, t->reference);
}
t->arch->release();
2008-04-13 18:15:04 +00:00
t->m->heap->free(t, sizeof(*t));
2007-12-11 21:26:59 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void dispose()
{
2014-02-25 22:46:35 +00:00
if (codeAllocator.memory.begin()) {
#ifndef AVIAN_AOT_ONLY
Memory::free(codeAllocator.memory);
#endif
}
2012-05-02 15:49:31 +00:00
compilationHandlers->dispose(allocator);
2014-02-22 06:23:01 +00:00
signals.unregisterHandler(SignalRegistrar::SegFault);
signals.unregisterHandler(SignalRegistrar::DivideByZero);
2014-02-22 00:06:17 +00:00
signals.setCrashDumpDirectory(0);
this->~MyProcessor();
2008-04-13 18:15:04 +00:00
allocator->free(this, sizeof(*this));
}
2008-04-09 19:08:13 +00:00
2014-07-11 15:50:18 +00:00
virtual object getStackTrace(Thread* vmt, Thread* vmTarget)
{
2008-04-09 19:08:13 +00:00
MyThread* t = static_cast<MyThread*>(vmt);
MyThread* target = static_cast<MyThread*>(vmTarget);
2008-12-02 02:38:00 +00:00
MyProcessor* p = this;
2014-07-11 15:50:18 +00:00
class Visitor : public System::ThreadVisitor {
2008-04-09 19:08:13 +00:00
public:
2014-07-11 15:50:18 +00:00
Visitor(MyThread* t, MyProcessor* p, MyThread* target)
: t(t), p(p), target(target), trace(0)
{
}
2008-04-09 19:08:13 +00:00
2014-07-11 15:50:18 +00:00
virtual void visit(void* ip, void* stack, void* link)
{
MyThread::TraceContext c(target, link);
2008-04-09 19:08:13 +00:00
if (methodForIp(t, ip)) {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
// we caught the thread in Java code - use the register values
c.ip = ip;
c.stack = stack;
fix a couple of subtle Thread.getStackTrace bugs The first problem was that, on x86, we failed to properly keep track of whether to expect the return address to be on the stack or not when unwinding through a frame. We were relying on a "stackLimit" pointer to tell us whether we were looking at the most recently-called frame by comparing it with the stack pointer for that frame. That was inaccurate in the case of a thread executing at the beginning of a method before a new frame is allocated, in which case the most recent two frames share a stack pointer, confusing the unwinder. The solution involves keeping track of how many frames we've looked at while walking the stack. The other problem was that compareIpToMethodBounds assumed every method was followed by at least one byte of padding before the next method started. That assumption was usually valid because we were storing the size following method code prior to the code itself. However, the last method of an AOT-compiled code image is not followed by any such method header and may instead be followed directly by native code with no intervening padding. In that case, we risk interpreting that native code as part of the preceding method, with potentially bizarre results. The reason for the compareIpToMethodBounds assumption was that methods which throw exceptions as their last instruction generate a non-returning call, which nonetheless push a return address on the stack which points past the end of the method, and the unwinder needs to know that return address belongs to that method. A better solution is to add an extra trap instruction to the end of such methods, which is what this patch does.
2012-05-05 00:35:13 +00:00
c.methodIsMostRecent = true;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
} else if (target->transition) {
// we caught the thread in native code while in the middle
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
// of updating the context fields (MyThread::stack, etc.)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
static_cast<MyThread::Context&>(c) = *(target->transition);
} else if (isVmInvokeUnsafeStack(ip)) {
// we caught the thread in native code just after returning
// from java code, but before clearing MyThread::stack
// (which now contains a garbage value), and the most recent
// Java frame, if any, can be found in
// MyThread::continuation or MyThread::trace
c.ip = 0;
c.stack = 0;
2014-07-11 15:50:18 +00:00
} else if (target->stack and (not isThunkUnsafeStack(t, ip))
and (not isVirtualThunk(t, ip))) {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
// we caught the thread in a thunk or native code, and the
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
// saved stack pointer indicates the most recent Java frame
// on the stack
c.ip = getIp(target);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
c.stack = target->stack;
} else if (isThunk(t, ip) or isVirtualThunk(t, ip)) {
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
// we caught the thread in a thunk where the stack register
// indicates the most recent Java frame on the stack
2014-04-29 19:26:40 +00:00
// On e.g. x86, the return address will have already been
// pushed onto the stack, in which case we use getIp to
2014-04-29 19:26:40 +00:00
// retrieve it. On e.g. ARM, it will be in the
// link register. Note that we can't just check if the link
// argument is null here, since we use ecx/rcx as a
// pseudo-link register on x86 for the purpose of tail
// calls.
c.ip = t->arch->hasLinkRegister() ? link : getIp(t, link, stack);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
c.stack = stack;
} else {
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
// we caught the thread in native code, and the most recent
// Java frame, if any, can be found in
// MyThread::continuation or MyThread::trace
c.ip = 0;
c.stack = 0;
}
2008-04-09 19:08:13 +00:00
if (ensure(t, traceSize(target))) {
t->setFlag(Thread::TracingFlag);
trace = makeTrace(t, target);
t->clearFlag(Thread::TracingFlag);
}
2008-04-09 19:08:13 +00:00
}
MyThread* t;
MyProcessor* p;
2008-04-09 19:08:13 +00:00
MyThread* target;
object trace;
} visitor(t, p, target);
2008-04-09 19:08:13 +00:00
t->m->system->visit(t->systemThread, target->systemThread, &visitor);
if (UNLIKELY(t->getFlags() & Thread::UseBackupHeapFlag)) {
2008-04-09 19:08:13 +00:00
PROTECT(t, visitor.trace);
collect(t, Heap::MinorCollection);
}
return visitor.trace ? visitor.trace : makeObjectArray(t, 0);
2008-04-09 19:08:13 +00:00
}
2008-11-23 23:58:01 +00:00
2014-02-25 22:46:35 +00:00
virtual void initialize(BootImage* image, Slice<uint8_t> code)
{
2009-06-01 03:16:58 +00:00
bootImage = image;
2014-02-25 22:46:35 +00:00
codeAllocator.memory = code;
2008-11-23 23:58:01 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void addCompilationHandler(CompilationHandler* handler)
{
2013-12-19 05:25:23 +00:00
compilationHandlers
= new (allocator->allocate(sizeof(CompilationHandlerList)))
CompilationHandlerList(compilationHandlers, handler);
2012-05-02 15:49:31 +00:00
}
2014-07-11 15:47:57 +00:00
virtual void compileMethod(Thread* vmt,
Zone* zone,
GcTriple** constants,
GcTriple** calls,
avian::codegen::DelayedPromise** addresses,
GcMethod* method,
OffsetResolver* resolver)
2008-11-23 23:58:01 +00:00
{
MyThread* t = static_cast<MyThread*>(vmt);
2014-06-29 04:57:07 +00:00
BootContext bootContext(t, *constants, *calls, *addresses, zone, resolver);
2008-11-23 23:58:01 +00:00
compile(t, &codeAllocator, &bootContext, method);
2008-11-23 23:58:01 +00:00
2014-06-29 04:57:07 +00:00
*constants = bootContext.constants;
*calls = bootContext.calls;
*addresses = bootContext.addresses;
2008-11-23 23:58:01 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void visitRoots(Thread* t, HeapWalker* w)
{
2014-07-11 15:47:57 +00:00
bootImage->methodTree = w->visitRoot(compileRoots(t)->methodTree());
bootImage->methodTreeSentinal
= w->visitRoot(compileRoots(t)->methodTreeSentinal());
bootImage->virtualThunks = w->visitRoot(compileRoots(t)->virtualThunks());
}
2014-07-11 15:50:18 +00:00
virtual void normalizeVirtualThunks(Thread* t)
{
GcWordArray* a = compileRoots(t)->virtualThunks();
2014-07-11 15:47:57 +00:00
for (unsigned i = 0; i < a->length(); i += 2) {
2014-06-29 04:57:07 +00:00
if (a->body()[i]) {
a->body()[i]
2014-02-25 22:46:35 +00:00
-= reinterpret_cast<uintptr_t>(codeAllocator.memory.begin());
}
}
}
2014-07-11 15:50:18 +00:00
virtual unsigned* makeCallTable(Thread* t, HeapWalker* w)
{
2009-06-01 03:16:58 +00:00
bootImage->codeSize = codeAllocator.offset;
bootImage->callCount = callTableSize;
2014-07-11 15:50:18 +00:00
unsigned* table = static_cast<unsigned*>(
t->m->heap->allocate(callTableSize * sizeof(unsigned) * 2));
2008-12-02 02:38:00 +00:00
unsigned index = 0;
GcArray* callTable = compileRoots(t)->callTable();
2014-06-29 04:57:07 +00:00
for (unsigned i = 0; i < callTable->length(); ++i) {
2014-07-11 15:47:57 +00:00
for (GcCallNode* p = cast<GcCallNode>(t, callTable->body()[i]); p;
p = p->next()) {
table[index++]
= targetVW(p->address() - reinterpret_cast<uintptr_t>(
codeAllocator.memory.begin()));
2014-02-25 22:46:35 +00:00
table[index++] = targetVW(
w->map()->find(p->target())
| (static_cast<unsigned>(p->flags()) << TargetBootShift));
2008-12-02 02:38:00 +00:00
}
}
2008-12-02 02:38:00 +00:00
return table;
}
2014-02-25 22:46:35 +00:00
virtual void boot(Thread* t, BootImage* image, uint8_t* code)
{
#ifndef AVIAN_AOT_ONLY
2014-02-25 22:46:35 +00:00
if (codeAllocator.memory.begin() == 0) {
codeAllocator.memory = Memory::allocate(ExecutableAreaSizeInBytes,
Memory::ReadWriteExecute);
expect(t, codeAllocator.memory.begin());
2009-06-01 03:16:58 +00:00
}
#endif
if (image and code) {
local::boot(static_cast<MyThread*>(t), image, code);
2008-12-02 02:38:00 +00:00
} else {
roots = makeCompileRoots(t, 0, 0, 0, 0, 0, 0, 0, 0, 0);
{
GcArray* ct = makeArray(t, 128);
// sequence point, for gc (don't recombine statements)
2014-06-25 20:38:13 +00:00
compileRoots(t)->setCallTable(t, ct);
}
2014-02-25 22:46:35 +00:00
GcTreeNode* tree = makeTreeNode(t, 0, 0, 0);
2014-06-25 20:38:13 +00:00
compileRoots(t)->setMethodTreeSentinal(t, tree);
compileRoots(t)->setMethodTree(t, tree);
tree->setLeft(t, tree);
tree->setRight(t, tree);
}
2013-01-29 17:23:22 +00:00
#ifdef AVIAN_AOT_ONLY
thunks = bootThunks;
#else
local::compileThunks(static_cast<MyThread*>(t), &codeAllocator);
2014-07-11 15:50:18 +00:00
if (not(image and code)) {
bootThunks = thunks;
}
2013-01-29 17:23:22 +00:00
#endif
2008-12-02 02:38:00 +00:00
segFaultHandler.m = t->m;
2014-07-11 15:50:18 +00:00
expect(
t,
signals.registerHandler(SignalRegistrar::SegFault, &segFaultHandler));
divideByZeroHandler.m = t->m;
2014-07-11 15:50:18 +00:00
expect(t,
signals.registerHandler(SignalRegistrar::DivideByZero,
&divideByZeroHandler));
2008-11-23 23:58:01 +00:00
}
2009-05-03 20:57:11 +00:00
2014-07-11 15:50:18 +00:00
virtual void callWithCurrentContinuation(Thread* t, object receiver)
{
if (Continuations) {
local::callWithCurrentContinuation(static_cast<MyThread*>(t), receiver);
2009-05-23 22:15:06 +00:00
} else {
abort(t);
2009-05-23 22:15:06 +00:00
}
2009-05-03 20:57:11 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void dynamicWind(Thread* t, object before, object thunk, object after)
2009-05-03 20:57:11 +00:00
{
if (Continuations) {
local::dynamicWind(static_cast<MyThread*>(t), before, thunk, after);
2009-05-23 22:15:06 +00:00
} else {
abort(t);
}
2009-05-23 22:15:06 +00:00
}
2009-05-06 00:29:05 +00:00
2014-07-11 15:47:57 +00:00
virtual void feedResultToContinuation(Thread* t,
GcContinuation* continuation,
2009-05-23 22:15:06 +00:00
object result)
{
if (Continuations) {
2014-06-29 03:50:32 +00:00
callContinuation(static_cast<MyThread*>(t), continuation, result, 0);
} else {
abort(t);
}
2009-05-23 22:15:06 +00:00
}
2009-05-06 00:29:05 +00:00
2014-07-11 15:47:57 +00:00
virtual void feedExceptionToContinuation(Thread* t,
GcContinuation* continuation,
GcThrowable* exception)
2009-05-23 22:15:06 +00:00
{
if (Continuations) {
2014-06-29 04:57:07 +00:00
callContinuation(static_cast<MyThread*>(t), continuation, 0, exception);
} else {
abort(t);
}
2009-05-06 00:29:05 +00:00
}
2014-07-11 15:50:18 +00:00
virtual void walkContinuationBody(Thread* t,
Heap::Walker* w,
object o,
2009-05-03 20:57:11 +00:00
unsigned start)
{
if (Continuations) {
2014-07-11 15:47:57 +00:00
local::walkContinuationBody(
static_cast<MyThread*>(t), w, cast<GcContinuation>(t, o), start);
} else {
abort(t);
}
2009-05-03 20:57:11 +00:00
}
2014-05-29 04:17:25 +00:00
System* s;
2014-02-22 00:06:17 +00:00
SignalRegistrar signals;
Allocator* allocator;
GcCompileRoots* roots;
BootImage* bootImage;
uintptr_t* heapImage;
uint8_t* codeImage;
unsigned codeImageSize;
SignalHandler segFaultHandler;
SignalHandler divideByZeroHandler;
FixedAllocator codeAllocator;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
ThunkCollection thunks;
ThunkCollection bootThunks;
unsigned callTableSize;
bool useNativeFeatures;
void* thunkTable[dummyIndex + 1];
2012-05-02 15:49:31 +00:00
CompilationHandlerList* compilationHandlers;
};
2014-07-11 15:50:18 +00:00
const char* stringOrNull(const char* str)
{
if (str) {
return str;
} else {
return "(null)";
}
}
2014-07-11 15:50:18 +00:00
size_t stringOrNullSize(const char* str)
{
return strlen(stringOrNull(str));
}
2014-07-11 15:50:18 +00:00
void logCompile(MyThread* t,
const void* code,
unsigned size,
const char* class_,
const char* name,
const char* spec)
2012-05-02 15:49:31 +00:00
{
static bool open = false;
if (not open) {
open = true;
const char* path = findProperty(t, "avian.jit.log");
if (path) {
compileLog = vm::fopen(path, "wb");
} else if (DebugCompile) {
compileLog = stderr;
}
}
if (compileLog) {
2014-07-11 15:50:18 +00:00
fprintf(compileLog,
"%p,%p %s.%s%s\n",
code,
static_cast<const uint8_t*>(code) + size,
class_,
name,
spec);
2012-05-02 15:49:31 +00:00
}
2013-12-19 05:25:23 +00:00
size_t nameLength = stringOrNullSize(class_) + stringOrNullSize(name)
+ stringOrNullSize(spec) + 2;
THREAD_RUNTIME_ARRAY(t, char, completeName, nameLength);
2013-12-19 05:25:23 +00:00
sprintf(RUNTIME_ARRAY_BODY(completeName),
"%s.%s%s",
stringOrNull(class_),
stringOrNull(name),
stringOrNull(spec));
2012-05-02 15:49:31 +00:00
MyProcessor* p = static_cast<MyProcessor*>(t->m->processor);
2014-07-11 15:50:18 +00:00
for (CompilationHandlerList* h = p->compilationHandlers; h; h = h->next) {
h->handler->compiled(code, 0, 0, RUNTIME_ARRAY_BODY(completeName));
2012-05-02 15:49:31 +00:00
}
}
2014-07-11 15:50:18 +00:00
void* compileMethod2(MyThread* t, void* ip)
{
GcCallNode* node = findCallNode(t, ip);
GcMethod* target = node->target();
PROTECT(t, node);
PROTECT(t, target);
t->trace->targetMethod = target;
THREAD_RESOURCE0(t, static_cast<MyThread*>(t)->trace->targetMethod = 0);
compile(t, codeAllocator(t), 0, target);
uint8_t* updateIp = static_cast<uint8_t*>(ip);
MyProcessor* p = processor(t);
bool updateCaller = updateIp < p->codeImage
2014-07-11 15:50:18 +00:00
or updateIp >= p->codeImage + p->codeImageSize;
uintptr_t address;
2014-05-29 04:17:25 +00:00
if (target->flags() & ACC_NATIVE) {
address = useLongJump(t, reinterpret_cast<uintptr_t>(ip))
2014-07-11 15:50:18 +00:00
or (not updateCaller)
? bootNativeThunk(t)
: nativeThunk(t);
} else {
address = methodAddress(t, target);
}
if (updateCaller) {
avian::codegen::lir::UnaryOperation op;
if (node->flags() & TraceElement::LongCall) {
if (node->flags() & TraceElement::TailCall) {
op = avian::codegen::lir::AlignedLongJump;
} else {
op = avian::codegen::lir::AlignedLongCall;
}
} else if (node->flags() & TraceElement::TailCall) {
op = avian::codegen::lir::AlignedJump;
} else {
op = avian::codegen::lir::AlignedCall;
}
updateCall(t, op, updateIp, reinterpret_cast<void*>(address));
}
return reinterpret_cast<void*>(address);
}
2014-07-11 15:50:18 +00:00
bool isThunk(MyProcessor::ThunkCollection* thunks, void* ip)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
uint8_t* thunkStart = thunks->default_.start;
2014-07-11 15:50:18 +00:00
uint8_t* thunkEnd = thunks->table.start + (thunks->table.length * ThunkCount);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
return (reinterpret_cast<uintptr_t>(ip)
>= reinterpret_cast<uintptr_t>(thunkStart)
and reinterpret_cast<uintptr_t>(ip)
2014-07-11 15:50:18 +00:00
< reinterpret_cast<uintptr_t>(thunkEnd));
}
2014-07-11 15:50:18 +00:00
bool isThunk(MyThread* t, void* ip)
{
MyProcessor* p = processor(t);
return isThunk(&(p->thunks), ip) or isThunk(&(p->bootThunks), ip);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
2014-07-11 15:50:18 +00:00
bool isThunkUnsafeStack(MyProcessor::Thunk* thunk, void* ip)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
return reinterpret_cast<uintptr_t>(ip)
2014-07-11 15:50:18 +00:00
>= reinterpret_cast<uintptr_t>(thunk->start)
and reinterpret_cast<uintptr_t>(ip)
< reinterpret_cast<uintptr_t>(thunk->start
+ thunk->frameSavedOffset);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
2014-07-11 15:50:18 +00:00
bool isThunkUnsafeStack(MyProcessor::ThunkCollection* thunks, void* ip)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
const unsigned NamedThunkCount = 5;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
MyProcessor::Thunk table[NamedThunkCount + ThunkCount];
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
table[0] = thunks->default_;
table[1] = thunks->defaultVirtual;
table[2] = thunks->native;
table[3] = thunks->aioob;
table[4] = thunks->stackOverflow;
2014-05-29 04:17:25 +00:00
for (unsigned i = 0; i < ThunkCount; ++i) {
2014-07-11 15:50:18 +00:00
new (table + NamedThunkCount + i)
MyProcessor::Thunk(thunks->table.start + (i * thunks->table.length),
thunks->table.frameSavedOffset,
thunks->table.length);
}
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
for (unsigned i = 0; i < NamedThunkCount + ThunkCount; ++i) {
if (isThunkUnsafeStack(table + i, ip)) {
return true;
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
}
return false;
}
2014-07-11 15:50:18 +00:00
bool isVirtualThunk(MyThread* t, void* ip)
{
GcWordArray* a = compileRoots(t)->virtualThunks();
2014-07-11 15:47:57 +00:00
for (unsigned i = 0; i < a->length(); i += 2) {
2014-06-29 04:57:07 +00:00
uintptr_t start = a->body()[i];
uintptr_t end = start + a->body()[i + 1];
if (reinterpret_cast<uintptr_t>(ip) >= start
2014-07-11 15:50:18 +00:00
and reinterpret_cast<uintptr_t>(ip) < end) {
return true;
}
}
return false;
}
2014-07-11 15:50:18 +00:00
bool isThunkUnsafeStack(MyThread* t, void* ip)
{
MyProcessor* p = processor(t);
2014-07-11 15:50:18 +00:00
return isThunk(t, ip) and (isThunkUnsafeStack(&(p->thunks), ip)
or isThunkUnsafeStack(&(p->bootThunks), ip));
}
2014-07-11 15:47:57 +00:00
GcCallNode* findCallNode(MyThread* t, void* address)
{
2008-12-02 02:38:00 +00:00
if (DebugCallTable) {
fprintf(stderr, "find call node %p\n", address);
}
// we must use a version of the call table at least as recent as the
// compiled form of the method containing the specified address (see
// compile(MyThread*, Allocator*, BootContext*, object)):
loadMemoryBarrier();
GcArray* table = compileRoots(t)->callTable();
2008-12-02 02:38:00 +00:00
intptr_t key = reinterpret_cast<intptr_t>(address);
2014-06-29 04:57:07 +00:00
unsigned index = static_cast<uintptr_t>(key) & (table->length() - 1);
2014-07-11 15:47:57 +00:00
for (GcCallNode* n = cast<GcCallNode>(t, table->body()[index]); n;
n = n->next()) {
intptr_t k = n->address();
2008-12-02 02:38:00 +00:00
if (k == key) {
return n;
}
}
2008-12-02 02:38:00 +00:00
return 0;
}
2014-07-11 15:47:57 +00:00
GcArray* resizeTable(MyThread* t, GcArray* oldTable, unsigned newLength)
2008-12-02 02:38:00 +00:00
{
PROTECT(t, oldTable);
GcCallNode* oldNode = 0;
2008-12-02 02:38:00 +00:00
PROTECT(t, oldNode);
2008-08-16 18:46:14 +00:00
2014-06-29 04:57:07 +00:00
GcArray* newTable = makeArray(t, newLength);
2008-12-02 02:38:00 +00:00
PROTECT(t, newTable);
2014-06-29 04:57:07 +00:00
for (unsigned i = 0; i < oldTable->length(); ++i) {
2014-07-11 15:47:57 +00:00
for (oldNode = cast<GcCallNode>(t, oldTable->body()[i]); oldNode;
oldNode = oldNode->next()) {
intptr_t k = oldNode->address();
2008-12-02 02:38:00 +00:00
unsigned index = k & (newLength - 1);
2014-07-11 15:47:57 +00:00
GcCallNode* newNode
= makeCallNode(t,
oldNode->address(),
oldNode->target(),
oldNode->flags(),
cast<GcCallNode>(t, newTable->body()[index]));
2008-12-02 02:38:00 +00:00
newTable->setBodyElement(t, index, newNode);
2008-12-02 02:38:00 +00:00
}
}
return newTable;
}
2014-07-11 15:47:57 +00:00
GcArray* insertCallNode(MyThread* t,
GcArray* table,
unsigned* size,
GcCallNode* node)
2008-12-02 02:38:00 +00:00
{
if (DebugCallTable) {
2014-07-11 15:47:57 +00:00
fprintf(stderr,
"insert call node %p\n",
2014-06-29 04:57:07 +00:00
reinterpret_cast<void*>(node->address()));
2008-12-02 02:38:00 +00:00
}
PROTECT(t, table);
PROTECT(t, node);
2014-07-11 15:50:18 +00:00
++(*size);
2008-12-02 02:38:00 +00:00
2014-06-29 04:57:07 +00:00
if (*size >= table->length() * 2) {
table = resizeTable(t, table, table->length() * 2);
2008-12-02 02:38:00 +00:00
}
2014-06-29 04:57:07 +00:00
intptr_t key = node->address();
unsigned index = static_cast<uintptr_t>(key) & (table->length() - 1);
2008-12-02 02:38:00 +00:00
2014-06-25 20:38:13 +00:00
node->setNext(t, cast<GcCallNode>(t, table->body()[index]));
table->setBodyElement(t, index, node);
2008-12-02 02:38:00 +00:00
return table;
}
2014-07-11 15:47:57 +00:00
GcHashMap* makeClassMap(Thread* t,
unsigned* table,
unsigned count,
uintptr_t* heap)
2008-12-02 02:38:00 +00:00
{
2014-06-28 20:41:27 +00:00
GcArray* array = makeArray(t, nextPowerOfTwo(count));
2014-05-29 04:17:25 +00:00
GcHashMap* map = makeHashMap(t, 0, array);
2008-12-02 02:38:00 +00:00
PROTECT(t, map);
2014-05-29 04:17:25 +00:00
2008-12-02 02:38:00 +00:00
for (unsigned i = 0; i < count; ++i) {
2014-06-29 04:57:07 +00:00
GcClass* c = cast<GcClass>(t, bootObject(heap, table[i]));
hashMapInsert(t, map, c->name(), c, byteArrayHash);
2008-12-02 02:38:00 +00:00
}
return map;
}
2014-07-11 15:47:57 +00:00
GcArray* makeStaticTableArray(Thread* t,
unsigned* bootTable,
unsigned bootCount,
unsigned* appTable,
unsigned appCount,
uintptr_t* heap)
2008-12-02 02:38:00 +00:00
{
2014-06-29 04:57:07 +00:00
GcArray* array = makeArray(t, bootCount + appCount);
2014-05-29 04:17:25 +00:00
for (unsigned i = 0; i < bootCount; ++i) {
2014-07-11 15:47:57 +00:00
array->setBodyElement(
t, i, cast<GcClass>(t, bootObject(heap, bootTable[i]))->staticTable());
}
for (unsigned i = 0; i < appCount; ++i) {
2014-07-11 15:47:57 +00:00
array->setBodyElement(
t,
(bootCount + i),
cast<GcClass>(t, bootObject(heap, appTable[i]))->staticTable());
2008-12-02 02:38:00 +00:00
}
return array;
}
2014-07-11 15:47:57 +00:00
GcHashMap* makeStringMap(Thread* t,
unsigned* table,
unsigned count,
uintptr_t* heap)
2008-12-02 02:38:00 +00:00
{
2014-06-28 20:41:27 +00:00
GcArray* array = makeArray(t, nextPowerOfTwo(count));
2014-06-25 20:38:13 +00:00
GcHashMap* map = makeWeakHashMap(t, 0, array)->as<GcHashMap>(t);
2008-12-02 02:38:00 +00:00
PROTECT(t, map);
2014-05-29 04:17:25 +00:00
2008-12-02 02:38:00 +00:00
for (unsigned i = 0; i < count; ++i) {
object s = bootObject(heap, table[i]);
2014-06-25 20:38:13 +00:00
hashMapInsert(t, map, s, 0, stringHash);
2008-12-02 02:38:00 +00:00
}
return map;
}
2014-07-11 15:47:57 +00:00
GcArray* makeCallTable(MyThread* t,
uintptr_t* heap,
unsigned* calls,
unsigned count,
uintptr_t base)
2008-12-02 02:38:00 +00:00
{
2014-06-29 04:57:07 +00:00
GcArray* table = makeArray(t, nextPowerOfTwo(count));
2008-12-02 02:38:00 +00:00
PROTECT(t, table);
unsigned size = 0;
for (unsigned i = 0; i < count; ++i) {
unsigned address = calls[i * 2];
unsigned target = calls[(i * 2) + 1];
2014-07-11 15:47:57 +00:00
GcCallNode* node
= makeCallNode(t,
base + address,
cast<GcMethod>(t, bootObject(heap, target & BootMask)),
target >> BootShift,
0);
2008-12-02 02:38:00 +00:00
table = insertCallNode(t, table, &size, node);
}
return table;
}
2014-07-11 15:50:18 +00:00
void fixupHeap(MyThread* t UNUSED,
uintptr_t* map,
unsigned size,
uintptr_t* heap)
2008-12-02 02:38:00 +00:00
{
for (unsigned word = 0; word < size; ++word) {
uintptr_t w = map[word];
if (w) {
for (unsigned bit = 0; bit < BitsPerWord; ++bit) {
if (w & (static_cast<uintptr_t>(1) << bit)) {
unsigned index = indexOf(word, bit);
2008-12-02 02:38:00 +00:00
uintptr_t* p = heap + index;
assertT(t, *p);
2014-05-29 04:17:25 +00:00
2008-12-02 02:38:00 +00:00
uintptr_t number = *p & BootMask;
uintptr_t mark = *p >> BootShift;
if (number) {
*p = reinterpret_cast<uintptr_t>(heap + (number - 1)) | mark;
if (false) {
fprintf(stderr,
"fixup %d: %d 0x%x\n",
index,
static_cast<unsigned>(number),
static_cast<unsigned>(*p));
}
2008-12-02 02:38:00 +00:00
} else {
*p = mark;
}
}
}
}
}
}
2014-07-11 15:47:57 +00:00
void resetClassRuntimeState(Thread* t,
GcClass* c,
uintptr_t* heap,
unsigned heapSize)
{
2014-06-29 04:57:07 +00:00
c->runtimeDataIndex() = 0;
2014-06-29 04:57:07 +00:00
if (c->arrayElementSize() == 0) {
GcSingleton* staticTable = c->staticTable()->as<GcSingleton>(t);
if (staticTable) {
for (unsigned i = 0; i < singletonCount(t, staticTable); ++i) {
if (singletonIsObject(t, staticTable, i)
2014-07-11 15:50:18 +00:00
and (reinterpret_cast<uintptr_t*>(
singletonObject(t, staticTable, i)) < heap
or reinterpret_cast<uintptr_t*>(singletonObject(
t, staticTable, i)) > heap + heapSize)) {
singletonObject(t, staticTable, i) = 0;
}
}
}
}
2014-06-29 04:57:07 +00:00
if (GcArray* mtable = cast<GcArray>(t, c->methodTable())) {
PROTECT(t, mtable);
for (unsigned i = 0; i < mtable->length(); ++i) {
GcMethod* m = cast<GcMethod>(t, mtable->body()[i]);
2014-06-29 04:57:07 +00:00
m->nativeID() = 0;
m->runtimeDataIndex() = 0;
2014-06-29 04:57:07 +00:00
if (m->vmFlags() & ClassInitFlag) {
c->vmFlags() |= NeedInitFlag;
c->vmFlags() &= ~InitErrorFlag;
}
}
}
2014-06-29 04:57:07 +00:00
t->m->processor->initVtable(t, c);
}
2014-07-11 15:47:57 +00:00
void resetRuntimeState(Thread* t,
GcHashMap* map,
uintptr_t* heap,
unsigned heapSize)
{
for (HashMapIterator it(t, map); it.hasMore();) {
2014-07-11 15:47:57 +00:00
resetClassRuntimeState(
t, cast<GcClass>(t, it.next()->second()), heap, heapSize);
}
}
2014-07-11 15:47:57 +00:00
void fixupMethods(Thread* t,
GcHashMap* map,
BootImage* image UNUSED,
uint8_t* code)
2008-12-02 02:38:00 +00:00
{
for (HashMapIterator it(t, map); it.hasMore();) {
2014-06-29 04:57:07 +00:00
GcClass* c = cast<GcClass>(t, it.next()->second());
2008-12-02 02:38:00 +00:00
2014-06-29 04:57:07 +00:00
if (GcArray* mtable = cast<GcArray>(t, c->methodTable())) {
PROTECT(t, mtable);
for (unsigned i = 0; i < mtable->length(); ++i) {
GcMethod* method = cast<GcMethod>(t, mtable->body()[i]);
2014-05-29 04:17:25 +00:00
if (method->code()) {
2014-07-11 15:47:57 +00:00
assertT(t,
methodCompiled(t, method)
<= static_cast<int32_t>(image->codeSize));
2008-12-02 02:38:00 +00:00
2014-07-11 15:47:57 +00:00
method->code()->compiled() = methodCompiled(t, method)
+ reinterpret_cast<uintptr_t>(code);
2008-12-02 02:38:00 +00:00
if (DebugCompile) {
2014-07-11 15:47:57 +00:00
logCompile(static_cast<MyThread*>(t),
reinterpret_cast<uint8_t*>(methodCompiled(t, method)),
methodCompiledSize(t, method),
reinterpret_cast<char*>(
method->class_()->name()->body().begin()),
reinterpret_cast<char*>(method->name()->body().begin()),
reinterpret_cast<char*>(method->spec()->body().begin()));
2008-12-02 02:38:00 +00:00
}
}
}
}
2014-06-29 04:57:07 +00:00
t->m->processor->initVtable(t, c);
2008-12-02 02:38:00 +00:00
}
}
2014-07-11 15:50:18 +00:00
MyProcessor::Thunk thunkToThunk(const BootImage::Thunk& thunk, uint8_t* base)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
2014-07-11 15:50:18 +00:00
return MyProcessor::Thunk(
base + thunk.start, thunk.frameSavedOffset, thunk.length);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
2014-07-11 15:50:18 +00:00
void findThunks(MyThread* t, BootImage* image, uint8_t* code)
2008-12-02 02:38:00 +00:00
{
MyProcessor* p = processor(t);
2014-05-29 04:17:25 +00:00
p->bootThunks.default_ = thunkToThunk(image->thunks.default_, code);
p->bootThunks.defaultVirtual
2014-07-11 15:50:18 +00:00
= thunkToThunk(image->thunks.defaultVirtual, code);
p->bootThunks.native = thunkToThunk(image->thunks.native, code);
p->bootThunks.aioob = thunkToThunk(image->thunks.aioob, code);
2014-07-11 15:50:18 +00:00
p->bootThunks.stackOverflow = thunkToThunk(image->thunks.stackOverflow, code);
p->bootThunks.table = thunkToThunk(image->thunks.table, code);
2008-12-02 02:38:00 +00:00
}
2014-07-11 15:50:18 +00:00
void fixupVirtualThunks(MyThread* t, uint8_t* code)
{
GcWordArray* a = compileRoots(t)->virtualThunks();
2014-07-11 15:47:57 +00:00
for (unsigned i = 0; i < a->length(); i += 2) {
2014-06-29 04:57:07 +00:00
if (a->body()[i]) {
a->body()[i] += reinterpret_cast<uintptr_t>(code);
}
}
}
2014-07-11 15:50:18 +00:00
void boot(MyThread* t, BootImage* image, uint8_t* code)
2008-12-02 02:38:00 +00:00
{
assertT(t, image->magic == BootImage::Magic);
2008-12-02 02:38:00 +00:00
unsigned* bootClassTable = reinterpret_cast<unsigned*>(image + 1);
unsigned* appClassTable = bootClassTable + image->bootClassCount;
unsigned* stringTable = appClassTable + image->appClassCount;
2008-12-02 02:38:00 +00:00
unsigned* callTable = stringTable + image->stringCount;
2014-07-11 15:50:18 +00:00
uintptr_t* heapMap = reinterpret_cast<uintptr_t*>(
padWord(reinterpret_cast<uintptr_t>(callTable + (image->callCount * 2))));
2014-07-11 15:50:18 +00:00
unsigned heapMapSizeInWords
= ceilingDivide(heapMapSize(image->heapSize), BytesPerWord);
2008-12-02 02:38:00 +00:00
uintptr_t* heap = heapMap + heapMapSizeInWords;
MyProcessor* p = static_cast<MyProcessor*>(t->m->processor);
t->heapImage = p->heapImage = heap;
if (false) {
fprintf(stderr,
"heap from %p to %p\n",
heap,
heap + ceilingDivide(image->heapSize, BytesPerWord));
}
2008-12-02 02:38:00 +00:00
t->codeImage = p->codeImage = code;
p->codeImageSize = image->codeSize;
2008-12-02 02:38:00 +00:00
if (false) {
fprintf(stderr, "code from %p to %p\n", code, code + image->codeSize);
}
2014-05-29 04:17:25 +00:00
if (not image->initialized) {
fixupHeap(t, heapMap, heapMapSizeInWords, heap);
}
2014-05-29 04:17:25 +00:00
2008-12-02 02:38:00 +00:00
t->m->heap->setImmortalHeap(heap, image->heapSize / BytesPerWord);
2014-06-28 23:24:24 +00:00
t->m->types = reinterpret_cast<GcArray*>(bootObject(heap, image->types));
t->m->roots = GcRoots::makeZeroed(t);
2014-07-11 15:47:57 +00:00
roots(t)->setBootLoader(
t, cast<GcClassLoader>(t, bootObject(heap, image->bootLoader)));
roots(t)->setAppLoader(
t, cast<GcClassLoader>(t, bootObject(heap, image->appLoader)));
2008-12-02 02:38:00 +00:00
p->roots = GcCompileRoots::makeZeroed(t);
2014-05-29 04:17:25 +00:00
2014-07-11 15:47:57 +00:00
compileRoots(t)->setMethodTree(
t, cast<GcTreeNode>(t, bootObject(heap, image->methodTree)));
compileRoots(t)->setMethodTreeSentinal(
t, cast<GcTreeNode>(t, bootObject(heap, image->methodTreeSentinal)));
2008-12-02 02:38:00 +00:00
2014-07-11 15:47:57 +00:00
compileRoots(t)->setVirtualThunks(
t, cast<GcWordArray>(t, bootObject(heap, image->virtualThunks)));
2014-06-30 01:44:41 +00:00
{
2014-07-11 15:47:57 +00:00
GcHashMap* map
= makeClassMap(t, bootClassTable, image->bootClassCount, heap);
2014-06-30 01:44:41 +00:00
// sequence point, for gc (don't recombine statements)
roots(t)->bootLoader()->setMap(t, map);
}
2014-07-11 15:47:57 +00:00
roots(t)->bootLoader()->as<GcSystemClassLoader>(t)->finder()
= t->m->bootFinder;
2014-06-30 01:44:41 +00:00
{
GcHashMap* map = makeClassMap(t, appClassTable, image->appClassCount, heap);
// sequence point, for gc (don't recombine statements)
roots(t)->appLoader()->setMap(t, map);
}
2014-06-30 01:44:41 +00:00
roots(t)->appLoader()->as<GcSystemClassLoader>(t)->finder() = t->m->appFinder;
{
2014-06-25 20:38:13 +00:00
GcHashMap* map = makeStringMap(t, stringTable, image->stringCount, heap);
// sequence point, for gc (don't recombine statements)
2014-06-25 20:38:13 +00:00
roots(t)->setStringMap(t, map);
}
2008-12-02 02:38:00 +00:00
p->callTableSize = image->callCount;
{
GcArray* ct = makeCallTable(t,
heap,
callTable,
image->callCount,
reinterpret_cast<uintptr_t>(code));
// sequence point, for gc (don't recombine statements)
2014-06-25 20:38:13 +00:00
compileRoots(t)->setCallTable(t, ct);
}
2008-12-02 02:38:00 +00:00
{
2014-07-11 15:47:57 +00:00
GcArray* staticTableArray = makeStaticTableArray(t,
bootClassTable,
image->bootClassCount,
appClassTable,
image->appClassCount,
heap);
// sequence point, for gc (don't recombine statements)
compileRoots(t)->setStaticTableArray(t, staticTableArray);
}
2014-05-29 04:17:25 +00:00
findThunks(t, image, code);
2008-12-02 02:38:00 +00:00
if (image->initialized) {
2014-07-11 15:47:57 +00:00
resetRuntimeState(t,
cast<GcHashMap>(t, roots(t)->bootLoader()->map()),
heap,
image->heapSize);
2014-07-11 15:47:57 +00:00
resetRuntimeState(t,
cast<GcHashMap>(t, roots(t)->appLoader()->map()),
heap,
image->heapSize);
2014-06-28 23:24:24 +00:00
for (unsigned i = 0; i < t->m->types->length(); ++i) {
2014-07-11 15:47:57 +00:00
resetClassRuntimeState(
t, type(t, static_cast<Gc::Type>(i)), heap, image->heapSize);
}
} else {
fixupVirtualThunks(t, code);
2014-07-11 15:47:57 +00:00
fixupMethods(
t, cast<GcHashMap>(t, roots(t)->bootLoader()->map()), image, code);
2014-07-11 15:47:57 +00:00
fixupMethods(
t, cast<GcHashMap>(t, roots(t)->appLoader()->map()), image, code);
}
image->initialized = true;
2008-12-02 02:38:00 +00:00
2014-06-30 01:44:41 +00:00
GcHashMap* map = makeHashMap(t, 0, 0);
// sequence point, for gc (don't recombine statements)
2014-06-25 20:38:13 +00:00
roots(t)->setBootstrapClassMap(t, map);
2008-12-02 02:38:00 +00:00
}
2014-07-11 15:50:18 +00:00
intptr_t getThunk(MyThread* t, Thunk thunk)
{
MyProcessor* p = processor(t);
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
return reinterpret_cast<intptr_t>(p->thunks.table.start
+ (thunk * p->thunks.table.length));
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
}
#ifndef AVIAN_AOT_ONLY
void insertCallNode(MyThread* t, GcCallNode* node)
{
GcArray* newArray = insertCallNode(
t, compileRoots(t)->callTable(), &(processor(t)->callTableSize), node);
// sequence point, for gc (don't recombine statements)
compileRoots(t)->setCallTable(t, newArray);
}
2014-07-11 15:50:18 +00:00
BootImage::Thunk thunkToThunk(const MyProcessor::Thunk& thunk, uint8_t* base)
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
{
2014-07-11 15:50:18 +00:00
return BootImage::Thunk(
thunk.start - base, thunk.frameSavedOffset, thunk.length);
}
using avian::codegen::OperandInfo;
namespace lir = avian::codegen::lir;
2014-07-11 15:50:18 +00:00
void compileCall(MyThread* t, Context* c, ThunkIndex index, bool call = true)
{
avian::codegen::Assembler* a = c->assembler;
if (processor(t)->bootImage) {
lir::Memory table(t->arch->thread(), TARGET_THREAD_THUNKTABLE);
lir::Register scratch(t->arch->scratch());
a->apply(lir::Move,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Memory, &table),
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &scratch));
lir::Memory proc(scratch.low, index * TargetBytesPerWord);
a->apply(lir::Move,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Memory, &proc),
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &scratch));
2014-07-11 15:50:18 +00:00
a->apply(call ? lir::Call : lir::Jump,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &scratch));
} else {
2014-07-11 15:50:18 +00:00
lir::Constant proc(new (&c->zone) avian::codegen::ResolvedPromise(
reinterpret_cast<intptr_t>(t->thunkTable[index])));
2014-07-11 15:50:18 +00:00
a->apply(call ? lir::LongCall : lir::LongJump,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Constant, &proc));
}
}
2014-07-11 15:50:18 +00:00
void compileThunks(MyThread* t, FixedAllocator* allocator)
{
MyProcessor* p = processor(t);
2014-07-11 15:50:18 +00:00
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
2014-05-29 04:17:25 +00:00
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
p->thunks.default_.frameSavedOffset = a->length();
lir::Register thread(t->arch->thread());
2014-12-05 01:33:10 +00:00
a->pushFrame(1, TargetBytesPerWord, lir::Operand::Type::RegisterPair, &thread);
2014-05-29 04:17:25 +00:00
compileCall(t, &context, compileMethodIndex);
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
a->popFrame(t->arch->alignFrameSize(1));
lir::Register result(t->arch->returnLow());
a->apply(lir::Jump,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &result));
2008-09-07 20:12:11 +00:00
p->thunks.default_.length = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
p->thunks.default_.start
= finish(t, allocator, a, "default", p->thunks.default_.length);
}
2014-07-11 15:50:18 +00:00
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
2014-05-29 04:17:25 +00:00
lir::Register class_(t->arch->virtualCallTarget());
2014-07-11 15:50:18 +00:00
lir::Memory virtualCallTargetSrc(
t->arch->stack(),
(t->arch->frameFooterSize() + t->arch->frameReturnAddressSize())
* TargetBytesPerWord);
2009-05-03 20:57:11 +00:00
a->apply(lir::Move,
2014-07-11 15:50:18 +00:00
OperandInfo(
2014-12-05 01:33:10 +00:00
TargetBytesPerWord, lir::Operand::Type::Memory, &virtualCallTargetSrc),
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &class_));
2009-05-03 20:57:11 +00:00
2014-07-11 15:50:18 +00:00
lir::Memory virtualCallTargetDst(t->arch->thread(),
TARGET_THREAD_VIRTUALCALLTARGET);
2009-05-03 20:57:11 +00:00
2014-07-11 15:50:18 +00:00
a->apply(
lir::Move,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &class_),
2014-07-11 15:50:18 +00:00
OperandInfo(
2014-12-05 01:33:10 +00:00
TargetBytesPerWord, lir::Operand::Type::Memory, &virtualCallTargetDst));
lir::Register index(t->arch->virtualCallIndex());
2014-07-11 15:50:18 +00:00
lir::Memory virtualCallIndex(t->arch->thread(),
TARGET_THREAD_VIRTUALCALLINDEX);
2009-05-03 20:57:11 +00:00
2014-07-11 15:50:18 +00:00
a->apply(
lir::Move,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &index),
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Memory, &virtualCallIndex));
2014-05-29 04:17:25 +00:00
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
p->thunks.defaultVirtual.frameSavedOffset = a->length();
lir::Register thread(t->arch->thread());
2014-12-05 01:33:10 +00:00
a->pushFrame(1, TargetBytesPerWord, lir::Operand::Type::RegisterPair, &thread);
compileCall(t, &context, compileVirtualMethodIndex);
2014-05-29 04:17:25 +00:00
support stack unwinding without using a frame pointer Previously, we unwound the stack by following the chain of frame pointers for normal returns, stack trace creation, and exception unwinding. On x86, this required reserving EBP/RBP for frame pointer duties, making it unavailable for general computation and requiring that it be explicitly saved and restored on entry and exit, respectively. On PowerPC, we use an ABI that makes the stack pointer double as a frame pointer, so it doesn't cost us anything. We've been using the same convention on ARM, but it doesn't match the native calling convention, which makes it unusable when we want to call native code from Java and pass arguments on the stack. So far, the ARM calling convention mismatch hasn't been an issue because we've never passed more arguments from Java to native code than would fit in registers. However, we must now pass an extra argument (the thread pointer) to e.g. divideLong so it can throw an exception on divide by zero, which means the last argument must be passed on the stack. This will clobber the linkage area we've been using to hold the frame pointer, so we need to stop using it. One solution would be to use the same convention on ARM as we do on x86, but this would introduce the same overhead of making a register unavailable for general use and extra code at method entry and exit. Instead, this commit removes the need for a frame pointer. Unwinding involves consulting a map of instruction offsets to frame sizes which is generated at compile time. This is necessary because stack trace creation can happen at any time due to Thread.getStackTrace being called by another thread, and the frame size varies during the execution of a method. So far, only x86(_64) is working, and continuations and tail call optimization are probably broken. More to come.
2011-01-17 02:05:05 +00:00
a->popFrame(t->arch->alignFrameSize(1));
lir::Register result(t->arch->returnLow());
a->apply(lir::Jump,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &result));
p->thunks.defaultVirtual.length = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
p->thunks.defaultVirtual.start = finish(
t, allocator, a, "defaultVirtual", p->thunks.defaultVirtual.length);
}
2014-07-11 15:50:18 +00:00
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
2008-08-16 18:46:14 +00:00
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
p->thunks.native.frameSavedOffset = a->length();
lir::Register thread(t->arch->thread());
2014-12-05 01:33:10 +00:00
a->pushFrame(1, TargetBytesPerWord, lir::Operand::Type::RegisterPair, &thread);
compileCall(t, &context, invokeNativeIndex);
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
a->popFrameAndUpdateStackAndReturn(t->arch->alignFrameSize(1),
TARGET_THREAD_NEWSTACK);
2008-09-07 20:12:11 +00:00
p->thunks.native.length = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
p->thunks.native.start
= finish(t, allocator, a, "native", p->thunks.native.length);
}
2014-07-11 15:50:18 +00:00
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
2008-08-16 18:46:14 +00:00
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
p->thunks.aioob.frameSavedOffset = a->length();
lir::Register thread(t->arch->thread());
2014-12-05 01:33:10 +00:00
a->pushFrame(1, TargetBytesPerWord, lir::Operand::Type::RegisterPair, &thread);
compileCall(t, &context, throwArrayIndexOutOfBoundsIndex);
2008-09-07 20:12:11 +00:00
p->thunks.aioob.length = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
p->thunks.aioob.start
= finish(t, allocator, a, "aioob", p->thunks.aioob.length);
}
2014-07-11 15:50:18 +00:00
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
2014-05-29 04:17:25 +00:00
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
p->thunks.stackOverflow.frameSavedOffset = a->length();
lir::Register thread(t->arch->thread());
2014-12-05 01:33:10 +00:00
a->pushFrame(1, TargetBytesPerWord, lir::Operand::Type::RegisterPair, &thread);
compileCall(t, &context, throwStackOverflowIndex);
p->thunks.stackOverflow.length = a->endBlock(false)->resolve(0, 0);
2008-09-07 20:12:11 +00:00
2014-07-11 15:50:18 +00:00
p->thunks.stackOverflow.start = finish(
t, allocator, a, "stackOverflow", p->thunks.stackOverflow.length);
}
2014-07-11 15:50:18 +00:00
{
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
2008-11-23 23:58:01 +00:00
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP);
2008-11-28 04:44:04 +00:00
p->thunks.table.frameSavedOffset = a->length();
2008-11-28 04:44:04 +00:00
compileCall(t, &context, dummyIndex, false);
p->thunks.table.length = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
p->thunks.table.start = static_cast<uint8_t*>(allocator->allocate(
p->thunks.table.length * ThunkCount, TargetBytesPerWord));
2008-11-28 04:44:04 +00:00
}
uint8_t* start = p->thunks.table.start;
2014-07-11 15:50:18 +00:00
#define THUNK(s) \
{ \
Context context(t); \
avian::codegen::Assembler* a = context.assembler; \
\
a->saveFrame(TARGET_THREAD_STACK, TARGET_THREAD_IP); \
\
p->thunks.table.frameSavedOffset = a->length(); \
\
compileCall(t, &context, s##Index, false); \
\
expect(t, a->endBlock(false)->resolve(0, 0) <= p->thunks.table.length); \
\
a->setDestination(start); \
a->write(); \
\
logCompile(t, start, p->thunks.table.length, 0, #s, 0); \
\
start += p->thunks.table.length; \
}
#include "thunks.cpp"
#undef THUNK
}
BootImage* image = p->bootImage;
if (image) {
2014-02-25 22:46:35 +00:00
uint8_t* imageBase = p->codeAllocator.memory.begin();
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
image->thunks.default_ = thunkToThunk(p->thunks.default_, imageBase);
2014-07-11 15:50:18 +00:00
image->thunks.defaultVirtual
= thunkToThunk(p->thunks.defaultVirtual, imageBase);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
image->thunks.native = thunkToThunk(p->thunks.native, imageBase);
image->thunks.aioob = thunkToThunk(p->thunks.aioob, imageBase);
2014-07-11 15:50:18 +00:00
image->thunks.stackOverflow
= thunkToThunk(p->thunks.stackOverflow, imageBase);
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
image->thunks.table = thunkToThunk(p->thunks.table, imageBase);
}
}
uintptr_t aioobThunk(MyThread* t)
{
return reinterpret_cast<uintptr_t>(processor(t)->thunks.aioob.start);
}
uintptr_t stackOverflowThunk(MyThread* t)
{
return reinterpret_cast<uintptr_t>(processor(t)->thunks.stackOverflow.start);
}
#endif // not AVIAN_AOT_ONLY
2014-07-11 15:50:18 +00:00
MyProcessor* processor(MyThread* t)
2007-10-04 03:19:39 +00:00
{
2008-12-02 02:38:00 +00:00
return static_cast<MyProcessor*>(t->m->processor);
2007-12-09 22:45:43 +00:00
}
2007-12-30 22:24:48 +00:00
2014-07-11 15:50:18 +00:00
uintptr_t defaultThunk(MyThread* t)
{
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
return reinterpret_cast<uintptr_t>(processor(t)->thunks.default_.start);
}
2014-07-11 15:50:18 +00:00
uintptr_t bootDefaultThunk(MyThread* t)
{
return reinterpret_cast<uintptr_t>(processor(t)->bootThunks.default_.start);
}
2014-07-11 15:50:18 +00:00
uintptr_t defaultVirtualThunk(MyThread* t)
{
2014-07-11 15:50:18 +00:00
return reinterpret_cast<uintptr_t>(processor(t)->thunks.defaultVirtual.start);
}
2014-07-11 15:50:18 +00:00
uintptr_t nativeThunk(MyThread* t)
2008-04-09 19:08:13 +00:00
{
fix Thread.getStackTrace race conditions Implementing Thread.getStackTrace is tricky. A thread may interrupt another thread at any time to grab a stack trace, including while the latter is executing Java code, JNI code, helper thunks, VM code, or while transitioning between any of these. To create a stack trace we use several context fields associated with the target thread, including snapshots of the instruction pointer, stack pointer, and frame pointer. These fields must be current, accurate, and consistent with each other in order to get a reliable trace. Otherwise, we risk crashing the VM by trying to walk garbage stack frames or by misinterpreting the size and/or content of legitimate frames. This commit addresses sensitive transition points such as entering the helper thunks which bridge the transitions from Java to native code (where we must save the stack and frame registers for use from native code) and stack unwinding (where we must atomically update the thread context fields to indicate which frame we are unwinding to). When grabbing a trace for another thread, we determine what kind of code we caught the thread executing in and use that information to choose the thread context values with which to begin the trace. See MyProcessor::getStackTrace::Visitor::visit for details. In order to atomically update the thread context fields, we do the following: 1. Create a temporary "transition" object to serve as a staging area and populate it with the new field values. 2. Update a transition pointer in the thread object to point to the object created above. As long as this pointer is non-null, interrupting threads will use the context values in the staging object instead of those in the thread object. 3. Update the fields in the thread object. 4. Clear the transition pointer in the thread object. We use a memory barrier between each of these steps to ensure they are made visible to other threads in program order. See MyThread::doTransition for details.
2010-06-16 01:10:48 +00:00
return reinterpret_cast<uintptr_t>(processor(t)->thunks.native.start);
2008-04-09 19:08:13 +00:00
}
2014-07-11 15:50:18 +00:00
uintptr_t bootNativeThunk(MyThread* t)
{
return reinterpret_cast<uintptr_t>(processor(t)->bootThunks.native.start);
}
2014-07-11 15:50:18 +00:00
bool unresolved(MyThread* t, uintptr_t methodAddress)
{
return methodAddress == defaultThunk(t)
2014-07-11 15:50:18 +00:00
or methodAddress == bootDefaultThunk(t);
}
2014-07-11 15:50:18 +00:00
uintptr_t compileVirtualThunk(MyThread* t, unsigned index, unsigned* size)
{
Context context(t);
avian::codegen::Assembler* a = context.assembler;
avian::codegen::ResolvedPromise indexPromise(index);
lir::Constant indexConstant(&indexPromise);
lir::Register indexRegister(t->arch->virtualCallIndex());
2014-07-11 15:50:18 +00:00
a->apply(
lir::Move,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Constant, &indexConstant),
OperandInfo(TargetBytesPerWord, lir::Operand::Type::RegisterPair, &indexRegister));
2014-05-29 04:17:25 +00:00
2014-07-11 15:50:18 +00:00
avian::codegen::ResolvedPromise defaultVirtualThunkPromise(
defaultVirtualThunk(t));
lir::Constant thunk(&defaultVirtualThunkPromise);
a->apply(lir::Jump,
2014-12-05 01:33:10 +00:00
OperandInfo(TargetBytesPerWord, lir::Operand::Type::Constant, &thunk));
*size = a->endBlock(false)->resolve(0, 0);
2014-07-11 15:50:18 +00:00
uint8_t* start = static_cast<uint8_t*>(
codeAllocator(t)->allocate(*size, TargetBytesPerWord));
a->setDestination(start);
a->write();
const char* const virtualThunkBaseName = "virtualThunk";
const size_t virtualThunkBaseNameLength = strlen(virtualThunkBaseName);
const size_t maxIntStringLength = 10;
2014-07-11 15:50:18 +00:00
THREAD_RUNTIME_ARRAY(t,
char,
virtualThunkName,
virtualThunkBaseNameLength + maxIntStringLength);
2014-07-11 15:50:18 +00:00
sprintf(RUNTIME_ARRAY_BODY(virtualThunkName),
"%s%d",
virtualThunkBaseName,
index);
2012-06-02 21:43:42 +00:00
logCompile(t, start, *size, 0, RUNTIME_ARRAY_BODY(virtualThunkName), 0);
return reinterpret_cast<uintptr_t>(start);
}
2014-07-11 15:50:18 +00:00
uintptr_t virtualThunk(MyThread* t, unsigned index)
{
ACQUIRE(t, t->m->classLock);
GcWordArray* oldArray = compileRoots(t)->virtualThunks();
2014-07-11 15:47:57 +00:00
if (oldArray == 0 or oldArray->length() <= index * 2) {
2014-06-29 04:57:07 +00:00
GcWordArray* newArray = makeWordArray(t, nextPowerOfTwo((index + 1) * 2));
if (compileRoots(t)->virtualThunks()) {
2014-06-29 04:57:07 +00:00
memcpy(newArray->body().begin(),
oldArray->body().begin(),
oldArray->length() * BytesPerWord);
}
2014-06-25 20:38:13 +00:00
compileRoots(t)->setVirtualThunks(t, newArray);
2014-06-29 04:57:07 +00:00
oldArray = newArray;
}
2014-06-29 04:57:07 +00:00
if (oldArray->body()[index * 2] == 0) {
unsigned size;
uintptr_t thunk = compileVirtualThunk(t, index, &size);
2014-06-29 04:57:07 +00:00
oldArray->body()[index * 2] = thunk;
oldArray->body()[(index * 2) + 1] = size;
}
2014-06-29 04:57:07 +00:00
return oldArray->body()[index * 2];
}
2014-07-11 15:47:57 +00:00
void compile(MyThread* t,
FixedAllocator* allocator UNUSED,
2014-07-11 15:47:57 +00:00
BootContext* bootContext,
GcMethod* method)
2007-12-09 22:45:43 +00:00
{
PROTECT(t, method);
2007-12-09 22:45:43 +00:00
2014-05-29 04:17:25 +00:00
if (bootContext == 0 and method->flags() & ACC_STATIC) {
initClass(t, method->class_());
}
2007-12-09 22:45:43 +00:00
if (methodAddress(t, method) != defaultThunk(t)) {
return;
}
2007-12-09 22:45:43 +00:00
assertT(t, (method->flags() & ACC_NATIVE) == 0);
#ifdef AVIAN_AOT_ONLY
abort(t);
#else
// We must avoid acquiring any locks until after the first pass of
// compilation, since this pass may trigger classloading operations
// involving application classloaders and thus the potential for
// deadlock. To make this safe, we use a private clone of the
// method so that we won't be confused if another thread updates the
// original while we're working.
2007-12-11 00:48:09 +00:00
2014-05-29 04:17:25 +00:00
GcMethod* clone = methodClone(t, method);
loadMemoryBarrier();
if (methodAddress(t, method) != defaultThunk(t)) {
return;
}
PROTECT(t, clone);
Context context(t, bootContext, clone);
compile(t, &context);
2014-07-11 15:47:57 +00:00
{
GcExceptionHandlerTable* ehTable = cast<GcExceptionHandlerTable>(
t, clone->code()->exceptionHandlerTable());
if (ehTable) {
PROTECT(t, ehTable);
// resolve all exception handler catch types before we acquire
// the class lock:
2014-06-29 04:57:07 +00:00
for (unsigned i = 0; i < ehTable->length(); ++i) {
uint64_t handler = ehTable->body()[i];
if (exceptionHandlerCatchType(handler)) {
2014-07-11 15:50:18 +00:00
resolveClassInPool(t, clone, exceptionHandlerCatchType(handler) - 1);
}
}
}
}
ACQUIRE(t, t->m->classLock);
if (methodAddress(t, method) != defaultThunk(t)) {
return;
}
finish(t, allocator, &context);
2014-05-29 04:17:25 +00:00
if (DebugMethodTree) {
2014-07-11 15:50:18 +00:00
fprintf(stderr,
"insert method at %p\n",
reinterpret_cast<void*>(methodCompiled(t, clone)));
2007-12-11 00:48:09 +00:00
}
// We can't update the MethodCode field on the original method
// before it is placed into the method tree, since another thread
// might call the method, from which stack unwinding would fail
// (since there is not yet an entry in the method tree). However,
// we can't insert the original method into the tree before updating
// the MethodCode field on it since we rely on that field to
// determine its position in the tree. Therefore, we insert the
// clone in its place. Later, we'll replace the clone with the
// original to save memory.
GcTreeNode* newTree = treeInsert(t,
&(context.zone),
compileRoots(t)->methodTree(),
methodCompiled(t, clone),
clone,
compileRoots(t)->methodTreeSentinal(),
compareIpToMethodBounds);
// sequence point, for gc (don't recombine statements)
2014-06-25 20:38:13 +00:00
compileRoots(t)->setMethodTree(t, newTree);
storeStoreMemoryBarrier();
2014-06-25 20:38:13 +00:00
method->setCode(t, clone->code());
if (methodVirtual(t, method)) {
2014-06-29 04:57:07 +00:00
method->class_()->vtable()[method->offset()]
2014-07-11 15:47:57 +00:00
= reinterpret_cast<void*>(methodCompiled(t, clone));
}
rework VM exception handling; throw OOMEs when appropriate This rather large commit modifies the VM to use non-local returns to throw exceptions instead of simply setting Thread::exception and returning frame-by-frame as it used to. This has several benefits: * Functions no longer need to check Thread::exception after each call which might throw an exception (which would be especially tedious and error-prone now that any function which allocates objects directly or indirectly might throw an OutOfMemoryError) * There's no need to audit the code for calls to functions which previously did not throw exceptions but later do * Performance should be improved slightly due to both the reduced need for conditionals and because undwinding now occurs in a single jump instead of a series of returns The main disadvantages are: * Slightly higher overhead for entering and leaving the VM via the JNI and JDK methods * Non-local returns can make the code harder to read * We must be careful to register destructors for stack-allocated resources with the Thread so they can be called prior to a non-local return The non-local return implementation is similar to setjmp/longjmp, except it uses continuation-passing style to avoid the need for cooperation from the C/C++ compiler. Native C++ exceptions would have also been an option, but that would introduce a dependence on libstdc++, which we're trying to avoid for portability reasons. Finally, this commit ensures that the VM throws an OutOfMemoryError instead of aborting when it reaches its memory ceiling. Currently, we treat the ceiling as a soft limit and temporarily exceed it as necessary to allow garbage collection and certain internal allocations to succeed, but refuse to allocate any Java objects until the heap size drops back below the ceiling.
2010-12-27 22:55:23 +00:00
// we've compiled the method and inserted it into the tree without
// error, so we ensure that the executable area not be deallocated
// when we dispose of the context:
context.executableAllocator = 0;
2014-06-29 04:57:07 +00:00
treeUpdate(t,
compileRoots(t)->methodTree(),
2014-06-29 04:57:07 +00:00
methodCompiled(t, clone),
method,
compileRoots(t)->methodTreeSentinal(),
2014-06-29 04:57:07 +00:00
compareIpToMethodBounds);
#endif // not AVIAN_AOT_ONLY
}
2007-12-11 00:48:09 +00:00
2014-07-11 15:47:57 +00:00
GcCompileRoots* compileRoots(Thread* t)
{
return processor(static_cast<MyThread*>(t))->roots;
}
2014-02-25 22:15:37 +00:00
avian::util::FixedAllocator* codeAllocator(MyThread* t)
{
return &(processor(t)->codeAllocator);
}
2014-07-11 15:50:18 +00:00
} // namespace local
2014-07-11 15:50:18 +00:00
} // namespace
2007-12-09 22:45:43 +00:00
namespace vm {
2014-02-22 00:06:17 +00:00
Processor* makeProcessor(System* system,
Allocator* allocator,
const char* crashDumpDirectory,
bool useNativeFeatures)
{
return new (allocator->allocate(sizeof(local::MyProcessor)))
2014-07-11 15:50:18 +00:00
local::MyProcessor(
system, allocator, crashDumpDirectory, useNativeFeatures);
}
2014-07-11 15:50:18 +00:00
} // namespace vm