/*
* Copyright (C) 2008 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifdef WITH_JIT
/*
* Target independent portion of Android's Jit
*/
#include "Dalvik.h"
#include "Jit.h"
#include "libdex/DexOpcodes.h"
#include <unistd.h>
#include <pthread.h>
#include <sys/time.h>
#include <signal.h>
#include "compiler/Compiler.h"
#include "compiler/CompilerUtility.h"
#include "compiler/CompilerIR.h"
#include <errno.h>
#if defined(WITH_SELF_VERIFICATION)
/* Allocate space for per-thread ShadowSpace data structures */
void* dvmSelfVerificationShadowSpaceAlloc(Thread* self)
{
self->shadowSpace = (ShadowSpace*) calloc(1, sizeof(ShadowSpace));
if (self->shadowSpace == NULL)
return NULL;
self->shadowSpace->registerSpaceSize = REG_SPACE;
self->shadowSpace->registerSpace =
(int*) calloc(self->shadowSpace->registerSpaceSize, sizeof(int));
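    /* A NULL result here (calloc failure) is returned to the caller as the
     * error indication. */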
return self->shadowSpace->registerSpace;
}
/* Free per-thread ShadowSpace data structures */
void dvmSelfVerificationShadowSpaceFree(Thread* self)
{
free(self->shadowSpace->registerSpace);
free(self->shadowSpace);
}
/*
* Save out PC, FP, thread state, and registers to shadow space.
* Return a pointer to the shadow space for JIT to use.
*
* The set of saved state from the Thread structure is:
* pc (Dalvik PC)
* fp (Dalvik FP)
* retval
* method
* methodClassDex
* interpStackEnd
*/
void* dvmSelfVerificationSaveState(const u2* pc, u4* fp,
Thread* self, int targetTrace)
{
ShadowSpace *shadowSpace = self->shadowSpace;
unsigned preBytes = self->interpSave.method->outsSize*4 +
sizeof(StackSaveArea);
unsigned postBytes = self->interpSave.method->registersSize*4;
//ALOGD("### selfVerificationSaveState(%d) pc: %#x fp: %#x",
// self->threadId, (int)pc, (int)fp);
if (shadowSpace->selfVerificationState != kSVSIdle) {
ALOGD("~~~ Save: INCORRECT PREVIOUS STATE(%d): %d",
self->threadId, shadowSpace->selfVerificationState);
ALOGD("********** SHADOW STATE DUMP **********");
ALOGD("PC: %#x FP: %#x", (int)pc, (int)fp);
}
shadowSpace->selfVerificationState = kSVSStart;
// Dynamically grow shadow register space if necessary
if (preBytes + postBytes > shadowSpace->registerSpaceSize * sizeof(u4)) {
free(shadowSpace->registerSpace);
shadowSpace->registerSpaceSize = (preBytes + postBytes) / sizeof(u4);
shadowSpace->registerSpace =
(int*) calloc(shadowSpace->registerSpaceSize, sizeof(u4));
}
// Remember original state
shadowSpace->startPC = pc;
shadowSpace->fp = fp;
shadowSpace->retval = self->interpSave.retval;
shadowSpace->interpStackEnd = self->interpStackEnd;
/*
     * Store the original method and DEX pointers here in case the trace
     * ends with a return or invoke, which will have changed the current
     * method by the time state is restored.
*/
shadowSpace->method = self->interpSave.method;
shadowSpace->methodClassDex = self->interpSave.methodClassDex;
shadowSpace->shadowFP = shadowSpace->registerSpace +
shadowSpace->registerSpaceSize - postBytes/4;
self->interpSave.curFrame = (u4*)shadowSpace->shadowFP;
self->interpStackEnd = (u1*)shadowSpace->registerSpace;
// Create a copy of the stack
memcpy(((char*)shadowSpace->shadowFP)-preBytes, ((char*)fp)-preBytes,
preBytes+postBytes);
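    /*
     * The copied region spans [fp - preBytes, fp + postBytes): the outs and
     * StackSaveArea below the Dalvik frame pointer plus the method's
     * registers at and above it. The JIT'd trace will execute against this
     * shadow copy (curFrame and interpStackEnd were redirected above), while
     * the original frame is left untouched for the later re-interpretation
     * and comparison.
     */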
// Setup the shadowed heap space
shadowSpace->heapSpaceTail = shadowSpace->heapSpace;
// Reset trace length
shadowSpace->traceLength = 0;
return shadowSpace;
}
/*
* Save ending PC, FP and compiled code exit point to shadow space.
* Return a pointer to the shadow space for JIT to restore state.
*/
void* dvmSelfVerificationRestoreState(const u2* pc, u4* fp,
SelfVerificationState exitState,
Thread* self)
{
ShadowSpace *shadowSpace = self->shadowSpace;
shadowSpace->endPC = pc;
shadowSpace->endShadowFP = fp;
shadowSpace->jitExitState = exitState;
//ALOGD("### selfVerificationRestoreState(%d) pc: %#x fp: %#x endPC: %#x",
// self->threadId, (int)shadowSpace->startPC, (int)shadowSpace->fp,
// (int)pc);
if (shadowSpace->selfVerificationState != kSVSStart) {
ALOGD("~~~ Restore: INCORRECT PREVIOUS STATE(%d): %d",
self->threadId, shadowSpace->selfVerificationState);
ALOGD("********** SHADOW STATE DUMP **********");
ALOGD("Dalvik PC: %#x endPC: %#x", (int)shadowSpace->startPC,
(int)shadowSpace->endPC);
ALOGD("Interp FP: %#x", (int)shadowSpace->fp);
ALOGD("Shadow FP: %#x endFP: %#x", (int)shadowSpace->shadowFP,
(int)shadowSpace->endShadowFP);
}
// Special case when punting after a single instruction
if (exitState == kSVSPunt && pc == shadowSpace->startPC) {
shadowSpace->selfVerificationState = kSVSIdle;
} else {
shadowSpace->selfVerificationState = exitState;
}
/* Restore state before returning */
self->interpSave.pc = shadowSpace->startPC;
self->interpSave.curFrame = shadowSpace->fp;
self->interpSave.method = shadowSpace->method;
self->interpSave.methodClassDex = shadowSpace->methodClassDex;
self->interpSave.retval = shadowSpace->retval;
self->interpStackEnd = shadowSpace->interpStackEnd;
return shadowSpace;
}
/* Print contents of virtual registers */
static void selfVerificationPrintRegisters(int* addr, int* addrRef,
int numWords)
{
int i;
for (i = 0; i < numWords; i++) {
ALOGD("(v%d) 0x%8x%s", i, addr[i], addr[i] != addrRef[i] ? " X" : "");
}
}
/* Print values maintained in shadowSpace */
static void selfVerificationDumpState(const u2* pc, Thread* self)
{
ShadowSpace* shadowSpace = self->shadowSpace;
StackSaveArea* stackSave = SAVEAREA_FROM_FP(self->interpSave.curFrame);
int frameBytes = (int) shadowSpace->registerSpace +
shadowSpace->registerSpaceSize*4 -
(int) shadowSpace->shadowFP;
int localRegs = 0;
int frameBytes2 = 0;
if ((uintptr_t)self->interpSave.curFrame < (uintptr_t)shadowSpace->fp) {
localRegs = (stackSave->method->registersSize -
stackSave->method->insSize)*4;
frameBytes2 = (int) shadowSpace->fp -
(int)self->interpSave.curFrame - localRegs;
}
ALOGD("********** SHADOW STATE DUMP **********");
ALOGD("CurrentPC: %#x, Offset: 0x%04x", (int)pc,
(int)(pc - stackSave->method->insns));
ALOGD("Class: %s", shadowSpace->method->clazz->descriptor);
ALOGD("Method: %s", shadowSpace->method->name);
ALOGD("Dalvik PC: %#x endPC: %#x", (int)shadowSpace->startPC,
(int)shadowSpace->endPC);
ALOGD("Interp FP: %#x endFP: %#x", (int)shadowSpace->fp,
(int)self->interpSave.curFrame);
ALOGD("Shadow FP: %#x endFP: %#x", (int)shadowSpace->shadowFP,
(int)shadowSpace->endShadowFP);
ALOGD("Frame1 Bytes: %d Frame2 Local: %d Bytes: %d", frameBytes,
localRegs, frameBytes2);
ALOGD("Trace length: %d State: %d", shadowSpace->traceLength,
shadowSpace->selfVerificationState);
}
/* Print decoded instructions in the current trace */
static void selfVerificationDumpTrace(const u2* pc, Thread* self)
{
ShadowSpace* shadowSpace = self->shadowSpace;
StackSaveArea* stackSave = SAVEAREA_FROM_FP(self->interpSave.curFrame);
int i, addr, offset;
DecodedInstruction *decInsn;
ALOGD("********** SHADOW TRACE DUMP **********");
for (i = 0; i < shadowSpace->traceLength; i++) {
addr = shadowSpace->trace[i].addr;
offset = (int)((u2*)addr - stackSave->method->insns);
decInsn = &(shadowSpace->trace[i].decInsn);
        /* The instruction is not fully decoded here, so some register operands may be garbage */
ALOGD("%#x: (0x%04x) %s",
addr, offset, dexGetOpcodeName(decInsn->opcode));
}
}
/* Code is forced into this spin loop when a divergence is detected */
static void selfVerificationSpinLoop(ShadowSpace *shadowSpace)
{
const u2 *startPC = shadowSpace->startPC;
JitTraceDescription* desc = dvmCopyTraceDescriptor(startPC, NULL);
if (desc) {
dvmCompilerWorkEnqueue(startPC, kWorkOrderTraceDebug, desc);
/*
* This function effectively terminates the VM right here, so not
* freeing the desc pointer when the enqueuing fails is acceptable.
*/
}
gDvmJit.selfVerificationSpin = true;
while(gDvmJit.selfVerificationSpin) sleep(10);
}
/*
* If here, we're re-interpreting an instruction that was included
* in a trace that was just executed. This routine is called for
* each instruction in the original trace, and compares state
* when it reaches the end point.
*
* TUNING: the interpretation mechanism now supports a counted
* single-step mechanism. If we were to associate an instruction
* count with each trace exit, we could just single-step the right
* number of cycles and then compare. This would improve detection
* of control divergences, as well as (slightly) simplify this code.
*/
void dvmCheckSelfVerification(const u2* pc, Thread* self)
{
ShadowSpace *shadowSpace = self->shadowSpace;
SelfVerificationState state = shadowSpace->selfVerificationState;
DecodedInstruction decInsn;
dexDecodeInstruction(pc, &decInsn);
//ALOGD("### DbgIntp(%d): PC: %#x endPC: %#x state: %d len: %d %s",
// self->threadId, (int)pc, (int)shadowSpace->endPC, state,
// shadowSpace->traceLength, dexGetOpcodeName(decInsn.opcode));
if (state == kSVSIdle || state == kSVSStart) {
ALOGD("~~~ DbgIntrp: INCORRECT PREVIOUS STATE(%d): %d",
self->threadId, state);
selfVerificationDumpState(pc, self);
selfVerificationDumpTrace(pc, self);
}
/*
* Generalize the self verification state to kSVSDebugInterp unless the
* entry reason is kSVSBackwardBranch or kSVSSingleStep.
*/
if (state != kSVSBackwardBranch && state != kSVSSingleStep) {
shadowSpace->selfVerificationState = kSVSDebugInterp;
}
/*
* Check if the current pc matches the endPC. Only check for non-zero
* trace length when backward branches are involved.
*/
if (pc == shadowSpace->endPC &&
(state == kSVSDebugInterp || state == kSVSSingleStep ||
(state == kSVSBackwardBranch && shadowSpace->traceLength != 0))) {
shadowSpace->selfVerificationState = kSVSIdle;
/* Check register space */
int frameBytes = (int) shadowSpace->registerSpace +
shadowSpace->registerSpaceSize*4 -
(int) shadowSpace->shadowFP;
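        /*
         * frameBytes is the size of the method's register frame as staged at
         * the top of the shadow register space (registersSize * 4 bytes at
         * save time).
         */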
if (memcmp(shadowSpace->fp, shadowSpace->shadowFP, frameBytes)) {
if (state == kSVSBackwardBranch) {
/* State mismatch on backward branch - try one more iteration */
shadowSpace->selfVerificationState = kSVSDebugInterp;
goto log_and_continue;
}
ALOGD("~~~ DbgIntp(%d): REGISTERS DIVERGENCE!", self->threadId);
selfVerificationDumpState(pc, self);
selfVerificationDumpTrace(pc, self);
ALOGD("*** Interp Registers: addr: %#x bytes: %d",
(int)shadowSpace->fp, frameBytes);
selfVerificationPrintRegisters((int*)shadowSpace->fp,
(int*)shadowSpace->shadowFP,
frameBytes/4);
ALOGD("*** Shadow Registers: addr: %#x bytes: %d",
(int)shadowSpace->shadowFP, frameBytes);
selfVerificationPrintRegisters((int*)shadowSpace->shadowFP,
(int*)shadowSpace->fp,
frameBytes/4);
selfVerificationSpinLoop(shadowSpace);
}
/* Check new frame if it exists (invokes only) */
if ((uintptr_t)self->interpSave.curFrame < (uintptr_t)shadowSpace->fp) {
StackSaveArea* stackSave =
SAVEAREA_FROM_FP(self->interpSave.curFrame);
int localRegs = (stackSave->method->registersSize -
stackSave->method->insSize)*4;
int frameBytes2 = (int) shadowSpace->fp -
(int) self->interpSave.curFrame - localRegs;
if (memcmp(((char*)self->interpSave.curFrame)+localRegs,
((char*)shadowSpace->endShadowFP)+localRegs, frameBytes2)) {
if (state == kSVSBackwardBranch) {
/*
* State mismatch on backward branch - try one more
* iteration.
*/
shadowSpace->selfVerificationState = kSVSDebugInterp;
goto log_and_continue;
}
ALOGD("~~~ DbgIntp(%d): REGISTERS (FRAME2) DIVERGENCE!",
self->threadId);
selfVerificationDumpState(pc, self);
selfVerificationDumpTrace(pc, self);
ALOGD("*** Interp Registers: addr: %#x l: %d bytes: %d",
(int)self->interpSave.curFrame, localRegs, frameBytes2);
selfVerificationPrintRegisters((int*)self->interpSave.curFrame,
(int*)shadowSpace->endShadowFP,
(frameBytes2+localRegs)/4);
ALOGD("*** Shadow Registers: addr: %#x l: %d bytes: %d",
(int)shadowSpace->endShadowFP, localRegs, frameBytes2);
selfVerificationPrintRegisters((int*)shadowSpace->endShadowFP,
(int*)self->interpSave.curFrame,
(frameBytes2+localRegs)/4);
selfVerificationSpinLoop(shadowSpace);
}
}
/* Check memory space */
bool memDiff = false;
ShadowHeap* heapSpacePtr;
for (heapSpacePtr = shadowSpace->heapSpace;
heapSpacePtr != shadowSpace->heapSpaceTail; heapSpacePtr++) {
int memData = *((unsigned int*) heapSpacePtr->addr);
if (heapSpacePtr->data != memData) {
if (state == kSVSBackwardBranch) {
/*
* State mismatch on backward branch - try one more
* iteration.
*/
shadowSpace->selfVerificationState = kSVSDebugInterp;
goto log_and_continue;
}
ALOGD("~~~ DbgIntp(%d): MEMORY DIVERGENCE!", self->threadId);
ALOGD("Addr: %#x Intrp Data: %#x Jit Data: %#x",
heapSpacePtr->addr, memData, heapSpacePtr->data);
selfVerificationDumpState(pc, self);
selfVerificationDumpTrace(pc, self);
memDiff = true;
}
}
if (memDiff) selfVerificationSpinLoop(shadowSpace);
/*
* Success. If this shadowed trace included a single-stepped
* instruction, we need to stay in the interpreter for one
* more interpretation before resuming.
*/
if (state == kSVSSingleStep) {
assert(self->jitResumeNPC != NULL);
assert(self->singleStepCount == 0);
self->singleStepCount = 1;
dvmEnableSubMode(self, kSubModeCountedStep);
}
/*
* Switch off shadow replay mode. The next shadowed trace
* execution will turn it back on.
*/
dvmDisableSubMode(self, kSubModeJitSV);
self->jitState = kJitDone;
return;
}
log_and_continue:
    /* If the end hasn't been reached, make sure the max trace length isn't exceeded */
if (shadowSpace->traceLength >= JIT_MAX_TRACE_LEN) {
ALOGD("~~~ DbgIntp(%d): CONTROL DIVERGENCE!", self->threadId);
ALOGD("startPC: %#x endPC: %#x currPC: %#x",
(int)shadowSpace->startPC, (int)shadowSpace->endPC, (int)pc);
selfVerificationDumpState(pc, self);
selfVerificationDumpTrace(pc, self);
selfVerificationSpinLoop(shadowSpace);
return;
}
/* Log the instruction address and decoded instruction for debug */
shadowSpace->trace[shadowSpace->traceLength].addr = (int)pc;
shadowSpace->trace[shadowSpace->traceLength].decInsn = decInsn;
shadowSpace->traceLength++;
}
#endif
/*
* If one of our fixed tables or the translation buffer fills up,
* call this routine to avoid wasting cycles on future translation requests.
*/
void dvmJitStopTranslationRequests()
{
/*
* Note 1: This won't necessarily stop all translation requests, and
* operates on a delayed mechanism. Running threads look to the copy
* of this value in their private thread structures and won't see
* this change until it is refreshed (which happens on interpreter
* entry).
* Note 2: This is a one-shot memory leak on this table. Because this is a
* permanent off switch for Jit profiling, it is a one-time leak of 1K
* bytes, and no further attempt will be made to re-allocate it. Can't
* free it because some thread may be holding a reference.
*/
gDvmJit.pProfTable = NULL;
dvmJitUpdateThreadStateAll();
}
#if defined(WITH_JIT_TUNING)
/* Convenience function to increment counter from assembly code */
void dvmBumpNoChain(int from)
{
gDvmJit.noChainExit[from]++;
}
/* Convenience function to increment counter from assembly code */
void dvmBumpNormal()
{
gDvmJit.normalExit++;
}
/* Convenience function to increment counter from assembly code */
void dvmBumpPunt(int from)
{
gDvmJit.puntExit++;
}
#endif
/* Dumps debugging & tuning stats to the log */
void dvmJitStats()
{
int i;
int hit;
int not_hit;
int chains;
int stubs;
if (gDvmJit.pJitEntryTable) {
for (i=0, stubs=chains=hit=not_hit=0;
i < (int) gDvmJit.jitTableSize;
i++) {
if (gDvmJit.pJitEntryTable[i].dPC != 0) {
hit++;
if (gDvmJit.pJitEntryTable[i].codeAddress ==
dvmCompilerGetInterpretTemplate())
stubs++;
} else
not_hit++;
if (gDvmJit.pJitEntryTable[i].u.info.chain != gDvmJit.jitTableSize)
chains++;
}
ALOGD("JIT: table size is %d, entries used is %d",
gDvmJit.jitTableSize, gDvmJit.jitTableEntriesUsed);
ALOGD("JIT: %d traces, %d slots, %d chains, %d thresh, %s",
hit, not_hit + hit, chains, gDvmJit.threshold,
gDvmJit.blockingMode ? "Blocking" : "Non-blocking");
#if defined(WITH_JIT_TUNING)
ALOGD("JIT: Code cache patches: %d", gDvmJit.codeCachePatches);
ALOGD("JIT: Lookups: %d hits, %d misses; %d normal, %d punt",
gDvmJit.addrLookupsFound, gDvmJit.addrLookupsNotFound,
gDvmJit.normalExit, gDvmJit.puntExit);
ALOGD("JIT: ICHits: %d", gDvmICHitCount);
ALOGD("JIT: noChainExit: %d IC miss, %d interp callsite, "
"%d switch overflow",
gDvmJit.noChainExit[kInlineCacheMiss],
gDvmJit.noChainExit[kCallsiteInterpreted],
gDvmJit.noChainExit[kSwitchOverflow]);
ALOGD("JIT: ICPatch: %d init, %d rejected, %d lock-free, %d queued, "
"%d dropped",
gDvmJit.icPatchInit, gDvmJit.icPatchRejected,
gDvmJit.icPatchLockFree, gDvmJit.icPatchQueued,
gDvmJit.icPatchDropped);
ALOGD("JIT: Invoke: %d mono, %d poly, %d native, %d return",
gDvmJit.invokeMonomorphic, gDvmJit.invokePolymorphic,
gDvmJit.invokeNative, gDvmJit.returnOp);
ALOGD("JIT: Inline: %d mgetter, %d msetter, %d pgetter, %d psetter",
gDvmJit.invokeMonoGetterInlined, gDvmJit.invokeMonoSetterInlined,
gDvmJit.invokePolyGetterInlined, gDvmJit.invokePolySetterInlined);
ALOGD("JIT: Total compilation time: %llu ms", gDvmJit.jitTime / 1000);
ALOGD("JIT: Avg unit compilation time: %llu us",
gDvmJit.numCompilations == 0 ? 0 :
gDvmJit.jitTime / gDvmJit.numCompilations);
ALOGD("JIT: Potential GC blocked by compiler: max %llu us / "
"avg %llu us (%d)",
gDvmJit.maxCompilerThreadBlockGCTime,
gDvmJit.numCompilerThreadBlockGC == 0 ?
0 : gDvmJit.compilerThreadBlockGCTime /
gDvmJit.numCompilerThreadBlockGC,
gDvmJit.numCompilerThreadBlockGC);
#endif
ALOGD("JIT: %d Translation chains, %d interp stubs",
gDvmJit.translationChains, stubs);
if (gDvmJit.profileMode == kTraceProfilingContinuous) {
dvmCompilerSortAndPrintTraceProfiles();
}
}
}
/* End current trace now & don't include current instruction */
void dvmJitEndTraceSelect(Thread* self, const u2* dPC)
{
if (self->jitState == kJitTSelect) {
self->jitState = kJitTSelectEnd;
}
if (self->jitState == kJitTSelectEnd) {
// Clean up and finish now.
dvmCheckJit(dPC, self);
}
}
/*
* Find an entry in the JitTable, creating if necessary.
* Returns null if table is full.
*/
static JitEntry *lookupAndAdd(const u2* dPC, bool callerLocked,
bool isMethodEntry)
{
u4 chainEndMarker = gDvmJit.jitTableSize;
u4 idx = dvmJitHash(dPC);
/*
* Walk the bucket chain to find an exact match for our PC and trace/method
* type
*/
while ((gDvmJit.pJitEntryTable[idx].u.info.chain != chainEndMarker) &&
((gDvmJit.pJitEntryTable[idx].dPC != dPC) ||
(gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry !=
isMethodEntry))) {
idx = gDvmJit.pJitEntryTable[idx].u.info.chain;
}
if (gDvmJit.pJitEntryTable[idx].dPC != dPC ||
gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry != isMethodEntry) {
/*
         * No match. Acquire jitTableLock and find the last
* slot in the chain. Possibly continue the chain walk in case
* some other thread allocated the slot we were looking
         * at previously (perhaps even the dPC we're trying to enter).
*/
if (!callerLocked)
dvmLockMutex(&gDvmJit.tableLock);
/*
* At this point, if .dPC is NULL, then the slot we're
* looking at is the target slot from the primary hash
* (the simple, and common case). Otherwise we're going
* to have to find a free slot and chain it.
*/
ANDROID_MEMBAR_FULL(); /* Make sure we reload [].dPC after lock */
if (gDvmJit.pJitEntryTable[idx].dPC != NULL) {
u4 prev;
while (gDvmJit.pJitEntryTable[idx].u.info.chain != chainEndMarker) {
if (gDvmJit.pJitEntryTable[idx].dPC == dPC &&
gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry ==
isMethodEntry) {
/* Another thread got there first for this dPC */
if (!callerLocked)
dvmUnlockMutex(&gDvmJit.tableLock);
return &gDvmJit.pJitEntryTable[idx];
}
idx = gDvmJit.pJitEntryTable[idx].u.info.chain;
}
/* Here, idx should be pointing to the last cell of an
* active chain whose last member contains a valid dPC */
assert(gDvmJit.pJitEntryTable[idx].dPC != NULL);
/* Linear walk to find a free cell and add it to the end */
prev = idx;
while (true) {
idx++;
if (idx == chainEndMarker)
idx = 0; /* Wraparound */
if ((gDvmJit.pJitEntryTable[idx].dPC == NULL) ||
(idx == prev))
break;
}
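            /*
             * idx now points at a free cell, or equals prev if the walk
             * wrapped around without finding one (i.e. the table is full).
             */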
if (idx != prev) {
JitEntryInfoUnion oldValue;
JitEntryInfoUnion newValue;
/*
                 * Although we hold the lock so that no one else will
* be trying to update a chain field, the other fields
* packed into the word may be in use by other threads.
*/
do {
oldValue = gDvmJit.pJitEntryTable[prev].u;
newValue = oldValue;
newValue.info.chain = idx;
} while (android_atomic_release_cas(oldValue.infoWord,
newValue.infoWord,
&gDvmJit.pJitEntryTable[prev].u.infoWord) != 0);
}
}
if (gDvmJit.pJitEntryTable[idx].dPC == NULL) {
gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry = isMethodEntry;
/*
* Initialize codeAddress and allocate the slot. Must
             * happen in this order (once dPC is set, the entry is live).
*/
android_atomic_release_store((int32_t)dPC,
(volatile int32_t *)(void *)&gDvmJit.pJitEntryTable[idx].dPC);
            /* For simulator mode, we need to initialize codeAddress to null */
gDvmJit.pJitEntryTable[idx].codeAddress = NULL;
gDvmJit.pJitEntryTable[idx].dPC = dPC;
gDvmJit.jitTableEntriesUsed++;
} else {
/* Table is full */
idx = chainEndMarker;
}
if (!callerLocked)
dvmUnlockMutex(&gDvmJit.tableLock);
}
return (idx == chainEndMarker) ? NULL : &gDvmJit.pJitEntryTable[idx];
}
/* Dump a trace description */
void dvmJitDumpTraceDesc(JitTraceDescription *trace)
{
int i;
bool done = false;
const u2* dpc;
const u2* dpcBase;
int curFrag = 0;
ALOGD("===========================================");
ALOGD("Trace dump %#x, Method %s off %#x",(int)trace,
trace->method->name,trace->trace[curFrag].info.frag.startOffset);
dpcBase = trace->method->insns;
while (!done) {
DecodedInstruction decInsn;
if (trace->trace[curFrag].isCode) {
ALOGD("Frag[%d]- Insts: %d, start: %#x, hint: %#x, end: %d",
curFrag, trace->trace[curFrag].info.frag.numInsts,
trace->trace[curFrag].info.frag.startOffset,
trace->trace[curFrag].info.frag.hint,
trace->trace[curFrag].info.frag.runEnd);
dpc = dpcBase + trace->trace[curFrag].info.frag.startOffset;
for (i=0; i<trace->trace[curFrag].info.frag.numInsts; i++) {
dexDecodeInstruction(dpc, &decInsn);
ALOGD(" 0x%04x - %s %#x",(dpc-dpcBase),
dexGetOpcodeName(decInsn.opcode),(int)dpc);
dpc += dexGetWidthFromOpcode(decInsn.opcode);
}
if (trace->trace[curFrag].info.frag.runEnd) {
done = true;
}
} else {
ALOGD("Frag[%d]- META info: 0x%08x", curFrag,
(int)trace->trace[curFrag].info.meta);
}
curFrag++;
}
ALOGD("-------------------------------------------");
}
/*
 * Append the class pointer of "this" and the current method pointer to the
 * current trace. That is, the trace runs will contain the following
 * components:
 *  + trace run that ends with an invoke (existing entry)
 *  + thisClass descriptor (new)
 *  + thisClass classLoader (new)
 *  + calleeMethod (new)
*/
static void insertClassMethodInfo(Thread* self,
const ClassObject* thisClass,
const Method* calleeMethod,
const DecodedInstruction* insn)
{
int currTraceRun = ++self->currTraceRun;
self->trace[currTraceRun].info.meta = thisClass ?
(void *) thisClass->descriptor : NULL;
self->trace[currTraceRun].isCode = false;
currTraceRun = ++self->currTraceRun;
self->trace[currTraceRun].info.meta = thisClass ?
(void *) thisClass->classLoader : NULL;
self->trace[currTraceRun].isCode = false;
currTraceRun = ++self->currTraceRun;
self->trace[currTraceRun].info.meta = (void *) calleeMethod;
self->trace[currTraceRun].isCode = false;
}
/*
* Check if the next instruction following the invoke is a move-result and if
* so add it to the trace. That is, this will add the trace run that includes
* the move-result to the trace list.
*
* + trace run that ends with an invoke (existing entry)
 *  + thisClass descriptor (existing entry)
 *  + thisClass classLoader (existing entry)
 *  + calleeMethod (existing entry)
* + move result (new)
*
* lastPC, len, offset are all from the preceding invoke instruction
*/
static void insertMoveResult(const u2 *lastPC, int len, int offset,
Thread *self)
{
DecodedInstruction nextDecInsn;
const u2 *moveResultPC = lastPC + len;
dexDecodeInstruction(moveResultPC, &nextDecInsn);
if ((nextDecInsn.opcode != OP_MOVE_RESULT) &&
(nextDecInsn.opcode != OP_MOVE_RESULT_WIDE) &&
(nextDecInsn.opcode != OP_MOVE_RESULT_OBJECT))
return;
/* We need to start a new trace run */
int currTraceRun = ++self->currTraceRun;
self->currRunHead = moveResultPC;
self->trace[currTraceRun].info.frag.startOffset = offset + len;
self->trace[currTraceRun].info.frag.numInsts = 1;
self->trace[currTraceRun].info.frag.runEnd = false;
self->trace[currTraceRun].info.frag.hint = kJitHintNone;
self->trace[currTraceRun].isCode = true;
self->totalTraceLen++;
self->currRunLen = dexGetWidthFromInstruction(moveResultPC);
}
/*
* Adds to the current trace request one instruction at a time, just
* before that instruction is interpreted. This is the primary trace
 * selection function. NOTE: return instructions are handled a little
* differently. In general, instructions are "proposed" to be added
* to the current trace prior to interpretation. If the interpreter
 * then successfully completes the instruction, it will be considered
* part of the request. This allows us to examine machine state prior
* to interpretation, and also abort the trace request if the instruction
* throws or does something unexpected. However, return instructions
* will cause an immediate end to the translation request - which will
* be passed to the compiler before the return completes. This is done
* in response to special handling of returns by the interpreter (and
* because returns cannot throw in a way that causes problems for the
 * translated code).
*/
void dvmCheckJit(const u2* pc, Thread* self)
{
const ClassObject *thisClass = self->callsiteClass;
const Method* curMethod = self->methodToCall;
int flags, len;
int allDone = false;
    /* Stay in break/single-step mode for the next instruction */
bool stayOneMoreInst = false;
    /* Prepare to handle the last PC and stage the current PC & method */
const u2 *lastPC = self->lastPC;
self->lastPC = pc;
switch (self->jitState) {
int offset;
DecodedInstruction decInsn;
case kJitTSelect:
/* First instruction - just remember the PC and exit */
if (lastPC == NULL) break;
/* Grow the trace around the last PC if jitState is kJitTSelect */
dexDecodeInstruction(lastPC, &decInsn);
#if TRACE_OPCODE_FILTER
            /* Only add opcodes supported by the JIT to the trace. End the
             * trace if this opcode is not supported.
             */
if (!dvmIsOpcodeSupportedByJit(decInsn.opcode)) {
self->jitState = kJitTSelectEnd;
break;
}
#endif
/*
* Treat {PACKED,SPARSE}_SWITCH as trace-ending instructions due
             * to the amount of space they take to generate the chaining
* cells.
*/
if (self->totalTraceLen != 0 &&
(decInsn.opcode == OP_PACKED_SWITCH ||
decInsn.opcode == OP_SPARSE_SWITCH)) {
self->jitState = kJitTSelectEnd;
break;
}
#if defined(SHOW_TRACE)
ALOGD("TraceGen: adding %s. lpc:%#x, pc:%#x",
dexGetOpcodeName(decInsn.opcode), (int)lastPC, (int)pc);
#endif
flags = dexGetFlagsFromOpcode(decInsn.opcode);
len = dexGetWidthFromInstruction(lastPC);
offset = lastPC - self->traceMethod->insns;
assert((unsigned) offset <
dvmGetMethodInsnsSize(self->traceMethod));
if (lastPC != self->currRunHead + self->currRunLen) {
int currTraceRun;
/* We need to start a new trace run */
currTraceRun = ++self->currTraceRun;
self->currRunLen = 0;
self->currRunHead = (u2*)lastPC;
self->trace[currTraceRun].info.frag.startOffset = offset;
self->trace[currTraceRun].info.frag.numInsts = 0;
self->trace[currTraceRun].info.frag.runEnd = false;
self->trace[currTraceRun].info.frag.hint = kJitHintNone;
self->trace[currTraceRun].isCode = true;
}
self->trace[self->currTraceRun].info.frag.numInsts++;
self->totalTraceLen++;
self->currRunLen += len;
/*
* If the last instruction is an invoke, we will try to sneak in
             * the move-result* (if present) into a separate trace run.
*/
{
int needReservedRun = (flags & kInstrInvoke) ? 1 : 0;
/* Will probably never hit this with the current trace builder */
if (self->currTraceRun ==
(MAX_JIT_RUN_LEN - 1 - needReservedRun)) {
self->jitState = kJitTSelectEnd;
}
}
if (!dexIsGoto(flags) &&
((flags & (kInstrCanBranch |
kInstrCanSwitch |
kInstrCanReturn |
kInstrInvoke)) != 0)) {
self->jitState = kJitTSelectEnd;
#if defined(SHOW_TRACE)
ALOGD("TraceGen: ending on %s, basic block end",
dexGetOpcodeName(decInsn.opcode));
#endif
/*
* If the current invoke is a {virtual,interface}, get the
* current class/method pair into the trace as well.
* If the next instruction is a variant of move-result, insert
* it to the trace too.
*/
if (flags & kInstrInvoke) {
insertClassMethodInfo(self, thisClass, curMethod,
&decInsn);
insertMoveResult(lastPC, len, offset, self);
}
}
/* Break on throw or self-loop */
if ((decInsn.opcode == OP_THROW) || (lastPC == pc)){
self->jitState = kJitTSelectEnd;
}
if (self->totalTraceLen >= JIT_MAX_TRACE_LEN) {
self->jitState = kJitTSelectEnd;
}
if ((flags & kInstrCanReturn) != kInstrCanReturn) {
break;
}
else {
/*
* Last instruction is a return - stay in the dbg interpreter
* for one more instruction if it is a non-void return, since
* we don't want to start a trace with move-result as the first
* instruction (which is already included in the trace
                 * containing the invoke).
*/
if (decInsn.opcode != OP_RETURN_VOID) {
stayOneMoreInst = true;
}
}
/* NOTE: intentional fallthrough for returns */
case kJitTSelectEnd:
{
/* Empty trace - set to bail to interpreter */
if (self->totalTraceLen == 0) {
dvmJitSetCodeAddr(self->currTraceHead,
dvmCompilerGetInterpretTemplate(),
dvmCompilerGetInterpretTemplateSet(),
false /* Not method entry */, 0);
self->jitState = kJitDone;
allDone = true;
break;
}
int lastTraceDesc = self->currTraceRun;
            /* Append a new empty code run if the last slot holds meta info */
if (!self->trace[lastTraceDesc].isCode) {
lastTraceDesc = ++self->currTraceRun;
self->trace[lastTraceDesc].info.frag.startOffset = 0;
self->trace[lastTraceDesc].info.frag.numInsts = 0;
self->trace[lastTraceDesc].info.frag.hint = kJitHintNone;
self->trace[lastTraceDesc].isCode = true;
}
/* Mark the end of the trace runs */
self->trace[lastTraceDesc].info.frag.runEnd = true;
JitTraceDescription* desc =
(JitTraceDescription*)malloc(sizeof(JitTraceDescription) +
sizeof(JitTraceRun) * (self->currTraceRun+1));
if (desc == NULL) {
ALOGE("Out of memory in trace selection");
dvmJitStopTranslationRequests();
self->jitState = kJitDone;
allDone = true;
break;
}
desc->method = self->traceMethod;
memcpy((char*)&(desc->trace[0]),
(char*)&(self->trace[0]),
sizeof(JitTraceRun) * (self->currTraceRun+1));
#if defined(SHOW_TRACE)
ALOGD("TraceGen: trace done, adding to queue");
dvmJitDumpTraceDesc(desc);
#endif
if (dvmCompilerWorkEnqueue(
self->currTraceHead,kWorkOrderTrace,desc)) {
/* Work order successfully enqueued */
if (gDvmJit.blockingMode) {
dvmCompilerDrainQueue();
}
} else {
/*
* Make sure the descriptor for the abandoned work order is
* freed.
*/
free(desc);
}
self->jitState = kJitDone;
allDone = true;
}
break;
case kJitDone:
allDone = true;
break;
case kJitNot:
allDone = true;
break;
default:
ALOGE("Unexpected JIT state: %d", self->jitState);
dvmAbort();
break;
}
/*
* If we're done with trace selection, switch off the control flags.
*/
if (allDone) {
dvmDisableSubMode(self, kSubModeJitTraceBuild);
if (stayOneMoreInst) {
// Clear jitResumeNPC explicitly since we know we don't need it
// here.
self->jitResumeNPC = NULL;
// Keep going in single-step mode for at least one more inst
if (self->singleStepCount == 0)
self->singleStepCount = 1;
dvmEnableSubMode(self, kSubModeCountedStep);
}
}
return;
}
JitEntry *dvmJitFindEntry(const u2* pc, bool isMethodEntry)
{
int idx = dvmJitHash(pc);
/* Expect a high hit rate on 1st shot */
if ((gDvmJit.pJitEntryTable[idx].dPC == pc) &&
(gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry == isMethodEntry))
return &gDvmJit.pJitEntryTable[idx];
else {
int chainEndMarker = gDvmJit.jitTableSize;
while (gDvmJit.pJitEntryTable[idx].u.info.chain != chainEndMarker) {
idx = gDvmJit.pJitEntryTable[idx].u.info.chain;
if ((gDvmJit.pJitEntryTable[idx].dPC == pc) &&
(gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry ==
isMethodEntry))
return &gDvmJit.pJitEntryTable[idx];
}
}
return NULL;
}
/*
* Walk through the JIT profile table and find the corresponding JIT code, in
 * the specified format (i.e. trace vs method). This routine needs to be fast.
*/
void* getCodeAddrCommon(const u2* dPC, bool methodEntry)
{
int idx = dvmJitHash(dPC);
const u2* pc = gDvmJit.pJitEntryTable[idx].dPC;
if (pc != NULL) {
bool hideTranslation = dvmJitHideTranslation();
if (pc == dPC &&
gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry == methodEntry) {
int offset = (gDvmJit.profileMode >= kTraceProfilingContinuous) ?
0 : gDvmJit.pJitEntryTable[idx].u.info.profileOffset;
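            /*
             * When trace profiling is active (profileMode >=
             * kTraceProfilingContinuous) the translation is entered at offset
             * 0 so its profiling prefix executes; otherwise the prefix is
             * skipped by entering profileOffset bytes into the translation.
             */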
intptr_t codeAddress =
(intptr_t)gDvmJit.pJitEntryTable[idx].codeAddress;
#if defined(WITH_JIT_TUNING)
gDvmJit.addrLookupsFound++;
#endif
return hideTranslation || !codeAddress ? NULL :
(void *)(codeAddress + offset);
} else {
int chainEndMarker = gDvmJit.jitTableSize;
while (gDvmJit.pJitEntryTable[idx].u.info.chain != chainEndMarker) {
idx = gDvmJit.pJitEntryTable[idx].u.info.chain;
if (gDvmJit.pJitEntryTable[idx].dPC == dPC &&
gDvmJit.pJitEntryTable[idx].u.info.isMethodEntry ==
methodEntry) {
int offset = (gDvmJit.profileMode >=
kTraceProfilingContinuous) ? 0 :
gDvmJit.pJitEntryTable[idx].u.info.profileOffset;
intptr_t codeAddress =
(intptr_t)gDvmJit.pJitEntryTable[idx].codeAddress;
#if defined(WITH_JIT_TUNING)
gDvmJit.addrLookupsFound++;
#endif
return hideTranslation || !codeAddress ? NULL :
(void *)(codeAddress + offset);
}
}
}
}
#if defined(WITH_JIT_TUNING)
gDvmJit.addrLookupsNotFound++;
#endif
return NULL;
}
/*
 * If a translated code address, in trace format, exists for the Dalvik
 * bytecode pointer, return it.
*/
void* dvmJitGetTraceAddr(const u2* dPC)
{
return getCodeAddrCommon(dPC, false /* method entry */);
}
/*
 * If a translated code address, in whole-method format, exists for the Dalvik
 * bytecode pointer, return it.
*/
void* dvmJitGetMethodAddr(const u2* dPC)
{
return getCodeAddrCommon(dPC, true /* method entry */);
}
/*
* Similar to dvmJitGetTraceAddr, but returns null if the calling
 * thread is in single-step mode.
*/
void* dvmJitGetTraceAddrThread(const u2* dPC, Thread* self)
{
return (self->interpBreak.ctl.breakFlags != 0) ? NULL :
getCodeAddrCommon(dPC, false /* method entry */);
}
/*
* Similar to dvmJitGetMethodAddr, but returns null if the calling
 * thread is in single-step mode.
*/
void* dvmJitGetMethodAddrThread(const u2* dPC, Thread* self)
{
return (self->interpBreak.ctl.breakFlags != 0) ? NULL :
getCodeAddrCommon(dPC, true /* method entry */);
}
/*
* Register the translated code pointer into the JitTable.
* NOTE: Once a codeAddress field transitions from initial state to
* JIT'd code, it must not be altered without first halting all
* threads. We defer the setting of the profile prefix size until
* after the new code address is set to ensure that the prefix offset
* is never applied to the initial interpret-only translation. All
* translations with non-zero profile prefixes will still be correct
* if entered as if the profile offset is 0, but the interpret-only
* template cannot handle a non-zero prefix.
* NOTE: JitTable must not be in danger of reset while this
* code is executing. see Issue 4271784 for details.
*/
void dvmJitSetCodeAddr(const u2* dPC, void *nPC, JitInstructionSetType set,
bool isMethodEntry, int profilePrefixSize)
{
JitEntryInfoUnion oldValue;
JitEntryInfoUnion newValue;
/*
* Get the JitTable slot for this dPC (or create one if JitTable
* has been reset between the time the trace was requested and
     * now).
*/
JitEntry *jitEntry = isMethodEntry ?
lookupAndAdd(dPC, false /* caller holds tableLock */, isMethodEntry) :
dvmJitFindEntry(dPC, isMethodEntry);
assert(jitEntry);
/* Note: order of update is important */
do {
oldValue = jitEntry->u;
newValue = oldValue;
newValue.info.isMethodEntry = isMethodEntry;
newValue.info.instructionSet = set;
newValue.info.profileOffset = profilePrefixSize;
} while (android_atomic_release_cas(
oldValue.infoWord, newValue.infoWord,
&jitEntry->u.infoWord) != 0);
jitEntry->codeAddress = nPC;
}
/*
 * Determine if a valid trace-building request is active. If so, set
* the proper flags in interpBreak and return. Trace selection will
* then begin normally via dvmCheckBefore.
*/
void dvmJitCheckTraceRequest(Thread* self)
{
int i;
/*
* A note on trace "hotness" filtering:
*
* Our first level trigger is intentionally loose - we need it to
* fire easily not just to identify potential traces to compile, but
* also to allow re-entry into the code cache.
*
* The 2nd level filter (done here) exists to be selective about
* what we actually compile. It works by requiring the same
* trace head "key" (defined as filterKey below) to appear twice in
* a relatively short period of time. The difficulty is defining the
* shape of the filterKey. Unfortunately, there is no "one size fits
* all" approach.
*
* For spiky execution profiles dominated by a smallish
* number of very hot loops, we would want the second-level filter
* to be very selective. A good selective filter is requiring an
* exact match of the Dalvik PC. In other words, defining filterKey as:
* intptr_t filterKey = (intptr_t)self->interpSave.pc
*
* However, for flat execution profiles we do best when aggressively
* translating. A heuristically decent proxy for this is to use
* the value of the method pointer containing the trace as the filterKey.
* Intuitively, this is saying that once any trace in a method appears hot,
* immediately translate any other trace from that same method that
* survives the first-level filter. Here, filterKey would be defined as:
* intptr_t filterKey = (intptr_t)self->interpSave.method
*
* The problem is that we can't easily detect whether we're dealing
* with a spiky or flat profile. If we go with the "pc" match approach,
* flat profiles perform poorly. If we go with the loose "method" match,
* we end up generating a lot of useless translations. Probably the
* best approach in the future will be to retain profile information
     * across runs of each application in order to determine its profile,
* and then choose once we have enough history.
*
     * However, for now we've decided to choose a compromise filter scheme that
* includes elements of both. The high order bits of the filter key
* are drawn from the enclosing method, and are combined with a slice
* of the low-order bits of the Dalvik pc of the trace head. The
     * looseness of the filter can be adjusted by changing the width of
* the Dalvik pc slice (JIT_TRACE_THRESH_FILTER_PC_BITS). The wider
* the slice, the tighter the filter.
*
     * Note: the fixed shifts in the function below reflect assumed word
     * alignment for method pointers and half-word alignment of the Dalvik pc.
     */
u4 methodKey = (u4)self->interpSave.method <<
(JIT_TRACE_THRESH_FILTER_PC_BITS - 2);
u4 pcKey = ((u4)self->interpSave.pc >> 1) &
((1 << JIT_TRACE_THRESH_FILTER_PC_BITS) - 1);
intptr_t filterKey = (intptr_t)(methodKey | pcKey);
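    /*
     * Illustration (values hypothetical): with
     * JIT_TRACE_THRESH_FILTER_PC_BITS == 4, pcKey keeps bits 1..4 of the
     * Dalvik pc in the low 4 bits of the key, while methodKey is the method
     * pointer shifted left by 2. Because method pointers are word aligned,
     * their two zero low bits land in the top of the pc slice, so the two
     * components never collide.
     */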
// Shouldn't be here if already building a trace.
assert((self->interpBreak.ctl.subMode & kSubModeJitTraceBuild)==0);
/* Check if the JIT request can be handled now */
if ((gDvmJit.pJitEntryTable != NULL) &&
((self->interpBreak.ctl.breakFlags & kInterpSingleStep) == 0)){
/* Bypass the filter for hot trace requests or during stress mode */
if (self->jitState == kJitTSelectRequest &&
gDvmJit.threshold > 6) {
/* Two-level filtering scheme */
for (i=0; i< JIT_TRACE_THRESH_FILTER_SIZE; i++) {
if (filterKey == self->threshFilter[i]) {
self->threshFilter[i] = 0; // Reset filter entry
break;
}
}
if (i == JIT_TRACE_THRESH_FILTER_SIZE) {
/*
* Use random replacement policy - otherwise we could miss a
* large loop that contains more traces than the size of our
* filter array.
*/
i = rand() % JIT_TRACE_THRESH_FILTER_SIZE;
self->threshFilter[i] = filterKey;
self->jitState = kJitDone;
}
}
/* If the compiler is backlogged, cancel any JIT actions */
if (gDvmJit.compilerQueueLength >= gDvmJit.compilerHighWater) {
self->jitState = kJitDone;
}
/*
* Check for additional reasons that might force the trace select
* request to be dropped
*/
if (self->jitState == kJitTSelectRequest ||
self->jitState == kJitTSelectRequestHot) {
if (dvmJitFindEntry(self->interpSave.pc, false)) {
                /* In progress - nothing to do */
self->jitState = kJitDone;
} else {
JitEntry *slot = lookupAndAdd(self->interpSave.pc,
false /* lock */,
false /* method entry */);
if (slot == NULL) {
/*
* Table is full. This should have been
* detected by the compiler thread and the table
* resized before we run into it here. Assume bad things
* are afoot and disable profiling.
*/
self->jitState = kJitDone;
ALOGD("JIT: JitTable full, disabling profiling");
dvmJitStopTranslationRequests();
}
}
}
switch (self->jitState) {
case kJitTSelectRequest:
case kJitTSelectRequestHot:
self->jitState = kJitTSelect;
self->traceMethod = self->interpSave.method;
self->currTraceHead = self->interpSave.pc;
self->currTraceRun = 0;
self->totalTraceLen = 0;
self->currRunHead = self->interpSave.pc;
self->currRunLen = 0;
self->trace[0].info.frag.startOffset =
self->interpSave.pc - self->interpSave.method->insns;
self->trace[0].info.frag.numInsts = 0;
self->trace[0].info.frag.runEnd = false;
self->trace[0].info.frag.hint = kJitHintNone;
self->trace[0].isCode = true;
self->lastPC = 0;
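            /*
             * lastPC starts out NULL so the first dvmCheckJit() call for this
             * trace just records the PC and returns (see kJitTSelect above).
             */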
/* Turn on trace selection mode */
dvmEnableSubMode(self, kSubModeJitTraceBuild);
#if defined(SHOW_TRACE)
ALOGD("Starting trace for %s at %#x",
self->interpSave.method->name, (int)self->interpSave.pc);
#endif
break;
case kJitDone:
break;
default:
ALOGE("Unexpected JIT state: %d", self->jitState);
dvmAbort();
}
} else {
/* Cannot build trace this time */
self->jitState = kJitDone;
}
}
/*
 * Resizes the JitTable. The new size must be a power of 2; returns true on
 * failure.
* Stops all threads, and thus is a heavyweight operation. May only be called
* by the compiler thread.
*/
bool dvmJitResizeJitTable( unsigned int size )
{
JitEntry *pNewTable;
JitEntry *pOldTable;
JitEntry tempEntry;
unsigned int oldSize;
unsigned int i;
assert(gDvmJit.pJitEntryTable != NULL);
assert(size && !(size & (size - 1))); /* Is power of 2? */
ALOGI("Jit: resizing JitTable from %d to %d", gDvmJit.jitTableSize, size);
if (size <= gDvmJit.jitTableSize) {
return true;
}
/* Make sure requested size is compatible with chain field width */
tempEntry.u.info.chain = size;
if (tempEntry.u.info.chain != size) {
ALOGD("Jit: JitTable request of %d too big", size);
return true;
}
pNewTable = (JitEntry*)calloc(size, sizeof(*pNewTable));
if (pNewTable == NULL) {
return true;
}
for (i=0; i< size; i++) {
pNewTable[i].u.info.chain = size; /* Initialize chain termination */
}
/* Stop all other interpreting/jit'ng threads */
dvmSuspendAllThreads(SUSPEND_FOR_TBL_RESIZE);
pOldTable = gDvmJit.pJitEntryTable;
oldSize = gDvmJit.jitTableSize;
dvmLockMutex(&gDvmJit.tableLock);
gDvmJit.pJitEntryTable = pNewTable;
gDvmJit.jitTableSize = size;
gDvmJit.jitTableMask = size - 1;
gDvmJit.jitTableEntriesUsed = 0;
for (i=0; i < oldSize; i++) {
if (pOldTable[i].dPC) {
JitEntry *p;
u2 chain;
p = lookupAndAdd(pOldTable[i].dPC, true /* holds tableLock*/,
pOldTable[i].u.info.isMethodEntry);
p->codeAddress = pOldTable[i].codeAddress;
/* We need to preserve the new chain field, but copy the rest */
chain = p->u.info.chain;
p->u = pOldTable[i].u;
p->u.info.chain = chain;
}
}
dvmUnlockMutex(&gDvmJit.tableLock);
free(pOldTable);
/* Restart the world */
dvmResumeAllThreads(SUSPEND_FOR_TBL_RESIZE);
return false;
}
/*
* Reset the JitTable to the initial clean state.
*/
void dvmJitResetTable()
{
JitEntry *jitEntry = gDvmJit.pJitEntryTable;
unsigned int size = gDvmJit.jitTableSize;
unsigned int i;
dvmLockMutex(&gDvmJit.tableLock);
    /* Note: if we need to preserve any existing counts, do so here. */
if (gDvmJit.pJitTraceProfCounters) {
for (i=0; i < JIT_PROF_BLOCK_BUCKETS; i++) {
if (gDvmJit.pJitTraceProfCounters->buckets[i])
memset((void *) gDvmJit.pJitTraceProfCounters->buckets[i],
0, sizeof(JitTraceCounter_t) * JIT_PROF_BLOCK_ENTRIES);
}
gDvmJit.pJitTraceProfCounters->next = 0;
}
memset((void *) jitEntry, 0, sizeof(JitEntry) * size);
for (i=0; i< size; i++) {
jitEntry[i].u.info.chain = size; /* Initialize chain termination */
}
gDvmJit.jitTableEntriesUsed = 0;
dvmUnlockMutex(&gDvmJit.tableLock);
}
/*
* Return the address of the next trace profile counter. This address
* will be embedded in the generated code for the trace, and thus cannot
* change while the trace exists.
*/
JitTraceCounter_t *dvmJitNextTraceCounter()
{
int idx = gDvmJit.pJitTraceProfCounters->next / JIT_PROF_BLOCK_ENTRIES;
int elem = gDvmJit.pJitTraceProfCounters->next % JIT_PROF_BLOCK_ENTRIES;
JitTraceCounter_t *res;
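    /*
     * 'next' is a running counter: idx selects the bucket and elem the slot
     * within that bucket's block of JIT_PROF_BLOCK_ENTRIES counters.
     */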
/* Lazily allocate blocks of counters */
if (!gDvmJit.pJitTraceProfCounters->buckets[idx]) {
JitTraceCounter_t *p =
(JitTraceCounter_t*) calloc(JIT_PROF_BLOCK_ENTRIES, sizeof(*p));
if (!p) {
ALOGE("Failed to allocate block of trace profile counters");
dvmAbort();
}
gDvmJit.pJitTraceProfCounters->buckets[idx] = p;
}
res = &gDvmJit.pJitTraceProfCounters->buckets[idx][elem];
gDvmJit.pJitTraceProfCounters->next++;
return res;
}
/*
 * Float/double to long conversion requires clamping to the min and max of the
 * integer form. If the target doesn't do this natively, use these helpers.
*/
s8 dvmJitd2l(double d)
{
static const double kMaxLong = (double)(s8)0x7fffffffffffffffULL;
static const double kMinLong = (double)(s8)0x8000000000000000ULL;
if (d >= kMaxLong)
return (s8)0x7fffffffffffffffULL;
else if (d <= kMinLong)
return (s8)0x8000000000000000ULL;
else if (d != d) // NaN case
return 0;
else
return (s8)d;
}
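/*
 * For example, dvmJitd2l(1e30) clamps to LLONG_MAX, negative overflow clamps
 * to LLONG_MIN, and NaN converts to 0 - matching the Java/Dalvik semantics of
 * double-to-long conversion. dvmJitf2l below behaves the same way for floats.
 */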
s8 dvmJitf2l(float f)
{
static const float kMaxLong = (float)(s8)0x7fffffffffffffffULL;
static const float kMinLong = (float)(s8)0x8000000000000000ULL;
if (f >= kMaxLong)
return (s8)0x7fffffffffffffffULL;
else if (f <= kMinLong)
return (s8)0x8000000000000000ULL;
else if (f != f) // NaN case
return 0;
else
return (s8)f;
}
/* Should only be called by the compiler thread */
void dvmJitChangeProfileMode(TraceProfilingModes newState)
{
if (gDvmJit.profileMode != newState) {
gDvmJit.profileMode = newState;
dvmJitUnchainAll();
}
}
void dvmJitTraceProfilingOn()
{
if (gDvmJit.profileMode == kTraceProfilingPeriodicOff)
dvmCompilerForceWorkEnqueue(NULL, kWorkOrderProfileMode,
(void*) kTraceProfilingPeriodicOn);
else if (gDvmJit.profileMode == kTraceProfilingDisabled)
dvmCompilerForceWorkEnqueue(NULL, kWorkOrderProfileMode,
(void*) kTraceProfilingContinuous);
}
void dvmJitTraceProfilingOff()
{
if (gDvmJit.profileMode == kTraceProfilingPeriodicOn)
dvmCompilerForceWorkEnqueue(NULL, kWorkOrderProfileMode,
(void*) kTraceProfilingPeriodicOff);
else if (gDvmJit.profileMode == kTraceProfilingContinuous)
dvmCompilerForceWorkEnqueue(NULL, kWorkOrderProfileMode,
(void*) kTraceProfilingDisabled);
}
/*
* Update JIT-specific info in Thread structure for a single thread
*/
void dvmJitUpdateThreadStateSingle(Thread* thread)
{
thread->pJitProfTable = gDvmJit.pProfTable;
thread->jitThreshold = gDvmJit.threshold;
}
/*
* Walk through the thread list and refresh all local copies of
* JIT global state (which was placed there for fast access).
*/
void dvmJitUpdateThreadStateAll()
{
Thread* self = dvmThreadSelf();
Thread* thread;
dvmLockThreadList(self);
for (thread = gDvm.threadList; thread != NULL; thread = thread->next) {
dvmJitUpdateThreadStateSingle(thread);
}
dvmUnlockThreadList();
}
#endif /* WITH_JIT */