vm/analysis/DexVerify.c - platform/dalvik - Gitiles

 /*
  * Copyright (C) 2008 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 /*
  * Dalvik classfile verification.  This file contains the verifier entry
  * points and the static constraint checks.
  */
 #include "Dalvik.h"
 #include "analysis/CodeVerify.h"
 #include "libdex/DexCatch.h"


 /* fwd */
 static bool verifyMethod(Method* meth);
 static bool verifyInstructions(VerifierData* vdata);


 /*
  * Verify a class.
  *
  * By the time we get here, the value of gDvm.classVerifyMode should already
  * have been factored in.  If you want to call into the verifier even
  * though verification is disabled, that's your business.
  *
  * Returns "true" on success.
  */
 bool dvmVerifyClass(ClassObject* clazz)
 {
     int i;

     if (dvmIsClassVerified(clazz)) {
         LOGD("Ignoring duplicate verify attempt on %s\n", clazz->descriptor);
         return true;
     }

     for (i = 0; i < clazz->directMethodCount; i++) {
         if (!verifyMethod(&clazz->directMethods[i])) {
             LOG_VFY("Verifier rejected class %s\n", clazz->descriptor);
             return false;
         }
     }
     for (i = 0; i < clazz->virtualMethodCount; i++) {
         if (!verifyMethod(&clazz->virtualMethods[i])) {
             LOG_VFY("Verifier rejected class %s\n", clazz->descriptor);
             return false;
         }
     }

     return true;
 }


 /*
  * Compute the width of the instruction at each address in the instruction
  * stream, and store it in vdata->insnFlags.  Addresses that are in the
  * middle of an instruction, or that are part of switch table data, are not
  * touched (so the caller should probably initialize "insnFlags" to zero).
  *
  * The "newInstanceCount" and "monitorEnterCount" fields in vdata are
  * also set.
  *
  * Performs some static checks, notably:
  * - opcode of first instruction begins at index 0
  * - only documented instructions may appear
  * - each instruction follows the last
  * - last byte of last instruction is at (code_length-1)
  *
  * Logs an error and returns "false" on failure.
  */
 static bool computeWidthsAndCountOps(VerifierData* vdata)
 {
     const Method* meth = vdata->method;
     InsnFlags* insnFlags = vdata->insnFlags;
     size_t insnCount = vdata->insnsSize;
     const u2* insns = meth->insns;
     bool result = false;
     int newInstanceCount = 0;
     int monitorEnterCount = 0;
     int i;

     for (i = 0; i < (int) insnCount; /**/) {
         size_t width = dexGetInstrOrTableWidth(insns);
         if (width == 0) {
             LOG_VFY_METH(meth, "VFY: invalid instruction (0x%04x)\n", *insns);
             goto bail;
         }

         if ((*insns & 0xff) == OP_NEW_INSTANCE)
             newInstanceCount++;
         if ((*insns & 0xff) == OP_MONITOR_ENTER)
             monitorEnterCount++;

         if (width > 65535) {
             LOG_VFY_METH(meth, "VFY: insane width %d\n", width);
             goto bail;
         }

         insnFlags[i] |= width;
         i += width;
         insns += width;
     }
     if (i != (int) dvmGetMethodInsnsSize(meth)) {
         LOG_VFY_METH(meth, "VFY: code did not end where expected (%d vs. %d)\n",
             i, dvmGetMethodInsnsSize(meth));
         goto bail;
     }

     result = true;
     vdata->newInstanceCount = newInstanceCount;
     vdata->monitorEnterCount = monitorEnterCount;

 bail:
     return result;
 }

 /*
  * Set the "in try" flags for all instructions protected by "try" statements.
  * Also sets the "branch target" flags for exception handlers.
  *
  * Call this after widths have been set in "insnFlags".
  *
  * Returns "false" if something in the exception table looks fishy, but
  * we're expecting the exception table to be somewhat sane.
  */
 static bool scanTryCatchBlocks(const Method* meth, InsnFlags* insnFlags)
 {
     u4 insnsSize = dvmGetMethodInsnsSize(meth);
     const DexCode* pCode = dvmGetMethodCode(meth);
     u4 triesSize = pCode->triesSize;
     const DexTry* pTries;
     u4 handlersSize;
     u4 offset;
     u4 i;

     if (triesSize == 0) {
         return true;
     }

     pTries = dexGetTries(pCode);
     handlersSize = dexGetHandlersSize(pCode);

     for (i = 0; i < triesSize; i++) {
         const DexTry* pTry = &pTries[i];
         u4 start = pTry->startAddr;
         u4 end = start + pTry->insnCount;
         u4 addr;

         if ((start >= end) || (start >= insnsSize) || (end > insnsSize)) {
             LOG_VFY_METH(meth,
                 "VFY: bad exception entry: startAddr=%d endAddr=%d (size=%d)\n",
                 start, end, insnsSize);
             return false;
         }

         if (dvmInsnGetWidth(insnFlags, start) == 0) {
             LOG_VFY_METH(meth,
                 "VFY: 'try' block starts inside an instruction (%d)\n",
                 start);
             return false;
         }

         for (addr = start; addr < end;
             addr += dvmInsnGetWidth(insnFlags, addr))
         {
             assert(dvmInsnGetWidth(insnFlags, addr) != 0);
             dvmInsnSetInTry(insnFlags, addr, true);
         }
     }

     /* Iterate over each of the handlers to verify target addresses. */
     offset = dexGetFirstHandlerOffset(pCode);
     for (i = 0; i < handlersSize; i++) {
         DexCatchIterator iterator;
         dexCatchIteratorInit(&iterator, pCode, offset);

         for (;;) {
             DexCatchHandler* handler = dexCatchIteratorNext(&iterator);
             u4 addr;

             if (handler == NULL) {
                 break;
             }

             addr = handler->address;
             if (dvmInsnGetWidth(insnFlags, addr) == 0) {
                 LOG_VFY_METH(meth,
                     "VFY: exception handler starts at bad address (%d)\n",
                     addr);
                 return false;
             }

             dvmInsnSetBranchTarget(insnFlags, addr, true);
         }

         offset = dexCatchIteratorGetEndOffset(&iterator, pCode);
     }

     return true;
 }

 /*
  * Perform verification on a single method.
  *
  * We do this in three passes:
  *  (1) Walk through all code units, determining instruction locations,
  *      widths, and other characteristics.
  *  (2) Walk through all code units, performing static checks on
  *      operands.
  *  (3) Iterate through the method, checking type safety and looking
  *      for code flow problems.
  *
  * Some checks may be bypassed depending on the verification mode.  We can't
  * turn this stuff off completely if we want to do "exact" GC.
  *
  * TODO: cite source?
  * Confirmed here:
  * - code array must not be empty
  * - (N/A) code_length must be less than 65536
  * Confirmed by computeWidthsAndCountOps():
  * - opcode of first instruction begins at index 0
  * - only documented instructions may appear
  * - each instruction follows the last
  * - last byte of last instruction is at (code_length-1)
  */
 static bool verifyMethod(Method* meth)
 {
     bool result = false;

     /*
      * Verifier state blob.  Various values will be cached here so we
      * can avoid expensive lookups and pass fewer arguments around.
      */
     VerifierData vdata;
 #if 1   // ndef NDEBUG
     memset(&vdata, 0x99, sizeof(vdata));
 #endif

     vdata.method = meth;
     vdata.insnsSize = dvmGetMethodInsnsSize(meth);
     vdata.insnRegCount = meth->registersSize;
     vdata.insnFlags = NULL;
     vdata.uninitMap = NULL;

     /*
      * If there aren't any instructions, make sure that's expected, then
      * exit successfully.  Note: for native methods, meth->insns gets set
      * to a native function pointer on first call, so don't use that as
      * an indicator.
      */
     if (vdata.insnsSize == 0) {
         if (!dvmIsNativeMethod(meth) && !dvmIsAbstractMethod(meth)) {
             LOG_VFY_METH(meth,
                 "VFY: zero-length code in concrete non-native method\n");
             goto bail;
         }

         goto success;
     }

     /*
      * Sanity-check the register counts.  ins + locals = registers, so make
      * sure that ins <= registers.
      */
     if (meth->insSize > meth->registersSize) {
         LOG_VFY_METH(meth, "VFY: bad register counts (ins=%d regs=%d)\n",
             meth->insSize, meth->registersSize);
         goto bail;
     }

     /*
      * Allocate and populate an array to hold instruction data.
      *
      * TODO: Consider keeping a reusable pre-allocated array sitting
      * around for smaller methods.
      */
     vdata.insnFlags = (InsnFlags*)
         calloc(dvmGetMethodInsnsSize(meth), sizeof(InsnFlags));
     if (vdata.insnFlags == NULL)
         goto bail;

     /*
      * Compute the width of each instruction and store the result in insnFlags.
      * Count up the #of occurrences of certain opcodes while we're at it.
      */
     if (!computeWidthsAndCountOps(&vdata))
         goto bail;

     /*
      * Allocate a map to hold the classes of uninitialized instances.
      */
     vdata.uninitMap = dvmCreateUninitInstanceMap(meth, vdata.insnFlags,
         vdata.newInstanceCount);
     if (vdata.uninitMap == NULL)
         goto bail;

     /*
      * Set the "in try" flags for all instructions guarded by a "try" block.
      */
     if (!scanTryCatchBlocks(meth, vdata.insnFlags))
         goto bail;

     /*
      * Perform static instruction verification.
      */
     if (!verifyInstructions(&vdata))
         goto bail;

     /*
      * Do code-flow analysis.
      *
      * We could probably skip this for a method with no registers, but
      * that's so rare that there's little point in checking.
      */
     if (!dvmVerifyCodeFlow(&vdata)) {
         //LOGD("+++ %s failed code flow\n", meth->name);
         goto bail;
     }

 success:
     result = true;

 bail:
     dvmFreeUninitInstanceMap(vdata.uninitMap);
     free(vdata.insnFlags);
     return result;
 }


 /*
  * Verify an array data table.  "curOffset" is the offset of the
  * fill-array-data instruction.
  */
 static bool checkArrayData(const Method* meth, u4 curOffset)
 {
     const u4 insnCount = dvmGetMethodInsnsSize(meth);
     const u2* insns = meth->insns + curOffset;
     const u2* arrayData;
     u4 valueCount, valueWidth, tableSize;
     s4 offsetToArrayData;

     assert(curOffset < insnCount);

     /* make sure the start of the array data table is in range */
     offsetToArrayData = insns[1] | (((s4)insns[2]) << 16);
     if ((s4)curOffset + offsetToArrayData < 0 ||
         curOffset + offsetToArrayData + 2 >= insnCount)
     {
         LOG_VFY("VFY: invalid array data start: at %d, data offset %d, "
                 "count %d\n",
             curOffset, offsetToArrayData, insnCount);
         return false;
     }

     /* offset to array data table is a relative branch-style offset */
     arrayData = insns + offsetToArrayData;

     /* make sure the table is 32-bit aligned */
     if ((((u4) arrayData) & 0x03) != 0) {
         LOG_VFY("VFY: unaligned array data table: at %d, data offset %d\n",
             curOffset, offsetToArrayData);
         return false;
     }

     valueWidth = arrayData[1];
     valueCount = *(u4*)(&arrayData[2]);

     tableSize = 4 + (valueWidth * valueCount + 1) / 2;

     /* make sure the end of the switch is in range */
     if (curOffset + offsetToArrayData + tableSize > insnCount) {
         LOG_VFY("VFY: invalid array data end: at %d, data offset %d, end %d, "
                 "count %d\n",
             curOffset, offsetToArrayData,
             curOffset + offsetToArrayData + tableSize, insnCount);
         return false;
     }

     return true;
 }

 /*
  * Perform static checks on a "new-instance" instruction.  Specifically,
  * make sure the class reference isn't for an array class.
  *
  * We don't need the actual class, just a pointer to the class name.
  */
 static bool checkNewInstance(const DvmDex* pDvmDex, u4 idx)
 {
     const char* classDescriptor;

     if (idx >= pDvmDex->pHeader->typeIdsSize) {
         LOG_VFY("VFY: bad type index %d (max %d)\n",
             idx, pDvmDex->pHeader->typeIdsSize);
         return false;
     }

     classDescriptor = dexStringByTypeIdx(pDvmDex->pDexFile, idx);
     if (classDescriptor[0] != 'L') {
         LOG_VFY("VFY: can't call new-instance on type '%s'\n",
             classDescriptor);
         return false;
     }

     return true;
 }

 /*
  * Perform static checks on a "new-array" instruction.  Specifically, make
  * sure they aren't creating an array of arrays that causes the number of
  * dimensions to exceed 255.
  */
 static bool checkNewArray(const DvmDex* pDvmDex, u4 idx)
 {
     const char* classDescriptor;

     if (idx >= pDvmDex->pHeader->typeIdsSize) {
         LOG_VFY("VFY: bad type index %d (max %d)\n",
             idx, pDvmDex->pHeader->typeIdsSize);
         return false;
     }

     classDescriptor = dexStringByTypeIdx(pDvmDex->pDexFile, idx);

     int bracketCount = 0;
     const char* cp = classDescriptor;
     while (*cp++ == '[')
         bracketCount++;

     if (bracketCount == 0) {
         /* The given class must be an array type. */
         LOG_VFY("VFY: can't new-array class '%s' (not an array)\n",
             classDescriptor);
         return false;
     } else if (bracketCount > 255) {
         /* It is illegal to create an array of more than 255 dimensions. */
         LOG_VFY("VFY: can't new-array class '%s' (exceeds limit)\n",
             classDescriptor);
         return false;
     }

     return true;
 }

 /*
  * Perform static checks on an instruction that takes a class constant.
  * Ensure that the class index is in the valid range.
  */
 static bool checkTypeIndex(const DvmDex* pDvmDex, u4 idx)
 {
     if (idx >= pDvmDex->pHeader->typeIdsSize) {
         LOG_VFY("VFY: bad type index %d (max %d)\n",
             idx, pDvmDex->pHeader->typeIdsSize);
         return false;
     }
     return true;
 }

 /*
  * Perform static checks on a field get or set instruction.  All we do
  * here is ensure that the field index is in the valid range.
  */
 static bool checkFieldIndex(const DvmDex* pDvmDex, u4 idx)
 {
     if (idx >= pDvmDex->pHeader->fieldIdsSize) {
         LOG_VFY("VFY: bad field index %d (max %d)\n",
             idx, pDvmDex->pHeader->fieldIdsSize);
         return false;
     }
     return true;
 }

 /*
  * Perform static checks on a method invocation instruction.  All we do
  * here is ensure that the method index is in the valid range.
  */
 static bool checkMethodIndex(const DvmDex* pDvmDex, u4 idx)
 {
     if (idx >= pDvmDex->pHeader->methodIdsSize) {
         LOG_VFY("VFY: bad method index %d (max %d)\n",
             idx, pDvmDex->pHeader->methodIdsSize);
         return false;
     }
     return true;
 }

 /*
  * Ensure that the string index is in the valid range.
  */
 static bool checkStringIndex(const DvmDex* pDvmDex, u4 idx)
 {
     if (idx >= pDvmDex->pHeader->stringIdsSize) {
         LOG_VFY("VFY: bad string index %d (max %d)\n",
             idx, pDvmDex->pHeader->stringIdsSize);
         return false;
     }
     return true;
 }

 /*
  * Ensure that the register index is valid for this method.
  */
 static bool checkRegisterIndex(const Method* meth, u4 idx)
 {
     if (idx >= meth->registersSize) {
         LOG_VFY("VFY: register index out of range (%d >= %d)\n",
             idx, meth->registersSize);
         return false;
     }
     return true;
 }

 /*
  * Ensure that the wide register index is valid for this method.
  */
 static bool checkWideRegisterIndex(const Method* meth, u4 idx)
 {
     if (idx+1 >= meth->registersSize) {
         LOG_VFY("VFY: wide register index out of range (%d+1 >= %d)\n",
             idx, meth->registersSize);
         return false;
     }
     return true;
 }

 /*
  * Check the register indices used in a "vararg" instruction, such as
  * invoke-virtual or filled-new-array.
  *
  * vA holds word count (0-5), args[] have values.
  *
  * There are some tests we don't do here, e.g. we don't try to verify
  * that invoking a method that takes a double is done with consecutive
  * registers.  This requires parsing the target method signature, which
  * we will be doing later on during the code flow analysis.
  */
 static bool checkVarargRegs(const Method* meth,
     const DecodedInstruction* pDecInsn)
 {
     u2 registersSize = meth->registersSize;
     unsigned int idx;

     if (pDecInsn->vA > 5) {
         LOG_VFY("VFY: invalid arg count (%d) in non-range invoke)\n",
             pDecInsn->vA);
         return false;
     }

     for (idx = 0; idx < pDecInsn->vA; idx++) {
         if (pDecInsn->arg[idx] > registersSize) {
             LOG_VFY("VFY: invalid reg index (%d) in non-range invoke (> %d)\n",
                 pDecInsn->arg[idx], registersSize);
             return false;
         }
     }

     return true;
 }

 /*
  * Check the register indices used in a "vararg/range" instruction, such as
  * invoke-virtual/range or filled-new-array/range.
  *
  * vA holds word count, vC holds index of first reg.
  */
 static bool checkVarargRangeRegs(const Method* meth,
     const DecodedInstruction* pDecInsn)
 {
     u2 registersSize = meth->registersSize;

     /*
      * vA/vC are unsigned 8-bit/16-bit quantities for /range instructions,
      * so there's no risk of integer overflow when adding them here.
      */
     if (pDecInsn->vA + pDecInsn->vC > registersSize) {
         LOG_VFY("VFY: invalid reg index %d+%d in range invoke (> %d)\n",
             pDecInsn->vA, pDecInsn->vC, registersSize);
         return false;
     }

     return true;
 }

 /*
  * Verify a switch table.  "curOffset" is the offset of the switch
  * instruction.
  *
  * Updates "insnFlags", setting the "branch target" flag.
  */
 static bool checkSwitchTargets(const Method* meth, InsnFlags* insnFlags,
     u4 curOffset)
 {
     const u4 insnCount = dvmGetMethodInsnsSize(meth);
     const u2* insns = meth->insns + curOffset;
     const u2* switchInsns;
     u2 expectedSignature;
     u4 switchCount, tableSize;
     s4 offsetToSwitch, offsetToKeys, offsetToTargets;
     s4 offset, absOffset;
     u4 targ;

     assert(curOffset < insnCount);

     /* make sure the start of the switch is in range */
     offsetToSwitch = insns[1] | ((s4) insns[2]) << 16;
     if ((s4) curOffset + offsetToSwitch < 0 ||
         curOffset + offsetToSwitch + 2 >= insnCount)
     {
         LOG_VFY("VFY: invalid switch start: at %d, switch offset %d, "
                 "count %d\n",
             curOffset, offsetToSwitch, insnCount);
         return false;
     }

     /* offset to switch table is a relative branch-style offset */
     switchInsns = insns + offsetToSwitch;

     /* make sure the table is 32-bit aligned */
     if ((((u4) switchInsns) & 0x03) != 0) {
         LOG_VFY("VFY: unaligned switch table: at %d, switch offset %d\n",
             curOffset, offsetToSwitch);
         return false;
     }

     switchCount = switchInsns[1];

     if ((*insns & 0xff) == OP_PACKED_SWITCH) {
         /* 0=sig, 1=count, 2/3=firstKey */
         offsetToTargets = 4;
         offsetToKeys = -1;
         expectedSignature = kPackedSwitchSignature;
     } else {
         /* 0=sig, 1=count, 2..count*2 = keys */
         offsetToKeys = 2;
         offsetToTargets = 2 + 2*switchCount;
         expectedSignature = kSparseSwitchSignature;
     }
     tableSize = offsetToTargets + switchCount*2;

     if (switchInsns[0] != expectedSignature) {
         LOG_VFY("VFY: wrong signature for switch table (0x%04x, wanted 0x%04x)\n",
             switchInsns[0], expectedSignature);
         return false;
     }

     /* make sure the end of the switch is in range */
     if (curOffset + offsetToSwitch + tableSize > (u4) insnCount) {
         LOG_VFY("VFY: invalid switch end: at %d, switch offset %d, end %d, "
                 "count %d\n",
             curOffset, offsetToSwitch, curOffset + offsetToSwitch + tableSize,
             insnCount);
         return false;
     }

     /* for a sparse switch, verify the keys are in ascending order */
     if (offsetToKeys > 0 && switchCount > 1) {
         s4 lastKey;

         lastKey = switchInsns[offsetToKeys] |
                   (switchInsns[offsetToKeys+1] << 16);
         for (targ = 1; targ < switchCount; targ++) {
             s4 key = (s4) switchInsns[offsetToKeys + targ*2] |
                     (s4) (switchInsns[offsetToKeys + targ*2 +1] << 16);
             if (key <= lastKey) {
                 LOG_VFY("VFY: invalid packed switch: last key=%d, this=%d\n",
                     lastKey, key);
                 return false;
             }

             lastKey = key;
         }
     }

     /* verify each switch target */
     for (targ = 0; targ < switchCount; targ++) {
         offset = (s4) switchInsns[offsetToTargets + targ*2] |
                 (s4) (switchInsns[offsetToTargets + targ*2 +1] << 16);
         absOffset = curOffset + offset;

         if (absOffset < 0 || absOffset >= (s4)insnCount ||
             !dvmInsnIsOpcode(insnFlags, absOffset))
         {
             LOG_VFY("VFY: invalid switch target %d (-> 0x%x) at 0x%x[%d]\n",
                 offset, absOffset, curOffset, targ);
             return false;
         }
         dvmInsnSetBranchTarget(insnFlags, absOffset, true);
     }

     return true;
 }

 /*
  * Verify that the target of a branch instruction is valid.
  *
  * We don't expect code to jump directly into an exception handler, but
  * it's valid to do so as long as the target isn't a "move-exception"
  * instruction.  We verify that in a later stage.
  *
  * The VM spec doesn't forbid an instruction from branching to itself,
  * but the Dalvik spec declares that only certain instructions can do so.
  *
  * Updates "insnFlags", setting the "branch target" flag.
  */
 static bool checkBranchTarget(const Method* meth, InsnFlags* insnFlags,
     int curOffset, bool selfOkay)
 {
     const int insnCount = dvmGetMethodInsnsSize(meth);
     int offset, absOffset;
     bool isConditional;

     if (!dvmGetBranchTarget(meth, insnFlags, curOffset, &offset,
             &isConditional))
         return false;

     if (!selfOkay && offset == 0) {
         LOG_VFY_METH(meth, "VFY: branch offset of zero not allowed at 0x%x\n",
             curOffset);
         return false;
     }

     /*
      * Check for 32-bit overflow.  This isn't strictly necessary if we can
      * depend on the VM to have identical "wrap-around" behavior, but
      * it's unwise to depend on that.
      */
     if (((s8) curOffset + (s8) offset) != (s8)(curOffset + offset)) {
         LOG_VFY_METH(meth, "VFY: branch target overflow 0x%x +%d\n",
             curOffset, offset);
         return false;
     }
     absOffset = curOffset + offset;
     if (absOffset < 0 || absOffset >= insnCount ||
         !dvmInsnIsOpcode(insnFlags, absOffset))
     {
         LOG_VFY_METH(meth,
             "VFY: invalid branch target %d (-> 0x%x) at 0x%x\n",
             offset, absOffset, curOffset);
         return false;
     }
     dvmInsnSetBranchTarget(insnFlags, absOffset, true);

     return true;
 }


 /*
  * Perform static verification on instructions.
  *
  * As a side effect, this sets the "branch target" flags in InsnFlags.
  *
  * "(CF)" items are handled during code-flow analysis.
  *
  * v3 4.10.1
  * - target of each jump and branch instruction must be valid
  * - targets of switch statements must be valid
  * - operands referencing constant pool entries must be valid
  * - (CF) operands of getfield, putfield, getstatic, putstatic must be valid
  * - (new) verify operands of "quick" field ops
  * - (CF) operands of method invocation instructions must be valid
  * - (new) verify operands of "quick" method invoke ops
  * - (CF) only invoke-direct can call a method starting with '<'
  * - (CF) <clinit> must never be called explicitly
  * - operands of instanceof, checkcast, new (and variants) must be valid
  * - new-array[-type] limited to 255 dimensions
  * - can't use "new" on an array class
  * - (?) limit dimensions in multi-array creation
  * - local variable load/store register values must be in valid range
  *
  * v3 4.11.1.2
  * - branches must be within the bounds of the code array
  * - targets of all control-flow instructions are the start of an instruction
  * - register accesses fall within range of allocated registers
  * - (N/A) access to constant pool must be of appropriate type
  * - code does not end in the middle of an instruction
  * - execution cannot fall off the end of the code
  * - (earlier) for each exception handler, the "try" area must begin and
  *   end at the start of an instruction (end can be at the end of the code)
  * - (earlier) for each exception handler, the handler must start at a valid
  *   instruction
  */
 static bool verifyInstructions(VerifierData* vdata)
 {
     const Method* meth = vdata->method;
     const DvmDex* pDvmDex = meth->clazz->pDvmDex;
     InsnFlags* insnFlags = vdata->insnFlags;
     const u2* insns = meth->insns;
     unsigned int codeOffset;

     /* the start of the method is a "branch target" */
     dvmInsnSetBranchTarget(insnFlags, 0, true);

     for (codeOffset = 0; codeOffset < vdata->insnsSize; /**/) {
         /*
          * Pull the instruction apart.
          */
         int width = dvmInsnGetWidth(insnFlags, codeOffset);
         DecodedInstruction decInsn;
         bool okay = true;

         dexDecodeInstruction(meth->insns + codeOffset, &decInsn);

         /*
          * Check register, type, class, field, method, and string indices
          * for out-of-range values.  Do additional checks on branch targets
          * and some special cases like new-instance and new-array.
          */
         switch (decInsn.opCode) {
         case OP_NOP:
         case OP_RETURN_VOID:
             /* nothing to check */
             break;
         case OP_MOVE_RESULT:
         case OP_MOVE_RESULT_OBJECT:
         case OP_MOVE_EXCEPTION:
         case OP_RETURN:
         case OP_RETURN_OBJECT:
         case OP_CONST_4:
         case OP_CONST_16:
         case OP_CONST:
         case OP_CONST_HIGH16:
         case OP_MONITOR_ENTER:
         case OP_MONITOR_EXIT:
         case OP_THROW:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             break;
         case OP_MOVE_RESULT_WIDE:
         case OP_RETURN_WIDE:
         case OP_CONST_WIDE_16:
         case OP_CONST_WIDE_32:
         case OP_CONST_WIDE:
         case OP_CONST_WIDE_HIGH16:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             break;
         case OP_GOTO:
         case OP_GOTO_16:
             okay &= checkBranchTarget(meth, insnFlags, codeOffset, false);
             break;
         case OP_GOTO_32:
             okay &= checkBranchTarget(meth, insnFlags, codeOffset, true);
             break;
         case OP_MOVE:
         case OP_MOVE_FROM16:
         case OP_MOVE_16:
         case OP_MOVE_OBJECT:
         case OP_MOVE_OBJECT_FROM16:
         case OP_MOVE_OBJECT_16:
         case OP_ARRAY_LENGTH:
         case OP_NEG_INT:
         case OP_NOT_INT:
         case OP_NEG_FLOAT:
         case OP_INT_TO_FLOAT:
         case OP_FLOAT_TO_INT:
         case OP_INT_TO_BYTE:
         case OP_INT_TO_CHAR:
         case OP_INT_TO_SHORT:
         case OP_ADD_INT_2ADDR:
         case OP_SUB_INT_2ADDR:
         case OP_MUL_INT_2ADDR:
         case OP_DIV_INT_2ADDR:
         case OP_REM_INT_2ADDR:
         case OP_AND_INT_2ADDR:
         case OP_OR_INT_2ADDR:
         case OP_XOR_INT_2ADDR:
         case OP_SHL_INT_2ADDR:
         case OP_SHR_INT_2ADDR:
         case OP_USHR_INT_2ADDR:
         case OP_ADD_FLOAT_2ADDR:
         case OP_SUB_FLOAT_2ADDR:
         case OP_MUL_FLOAT_2ADDR:
         case OP_DIV_FLOAT_2ADDR:
         case OP_REM_FLOAT_2ADDR:
         case OP_ADD_INT_LIT16:
         case OP_RSUB_INT:
         case OP_MUL_INT_LIT16:
         case OP_DIV_INT_LIT16:
         case OP_REM_INT_LIT16:
         case OP_AND_INT_LIT16:
         case OP_OR_INT_LIT16:
         case OP_XOR_INT_LIT16:
         case OP_ADD_INT_LIT8:
         case OP_RSUB_INT_LIT8:
         case OP_MUL_INT_LIT8:
         case OP_DIV_INT_LIT8:
         case OP_REM_INT_LIT8:
         case OP_AND_INT_LIT8:
         case OP_OR_INT_LIT8:
         case OP_XOR_INT_LIT8:
         case OP_SHL_INT_LIT8:
         case OP_SHR_INT_LIT8:
         case OP_USHR_INT_LIT8:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             break;
         case OP_INT_TO_LONG:
         case OP_INT_TO_DOUBLE:
         case OP_FLOAT_TO_LONG:
         case OP_FLOAT_TO_DOUBLE:
         case OP_SHL_LONG_2ADDR:
         case OP_SHR_LONG_2ADDR:
         case OP_USHR_LONG_2ADDR:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             break;
         case OP_LONG_TO_INT:
         case OP_LONG_TO_FLOAT:
         case OP_DOUBLE_TO_INT:
         case OP_DOUBLE_TO_FLOAT:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkWideRegisterIndex(meth, decInsn.vB);
             break;
         case OP_MOVE_WIDE:
         case OP_MOVE_WIDE_FROM16:
         case OP_MOVE_WIDE_16:
         case OP_DOUBLE_TO_LONG:
         case OP_LONG_TO_DOUBLE:
         case OP_NEG_DOUBLE:
         case OP_NEG_LONG:
         case OP_NOT_LONG:
         case OP_ADD_LONG_2ADDR:
         case OP_SUB_LONG_2ADDR:
         case OP_MUL_LONG_2ADDR:
         case OP_DIV_LONG_2ADDR:
         case OP_REM_LONG_2ADDR:
         case OP_AND_LONG_2ADDR:
         case OP_OR_LONG_2ADDR:
         case OP_XOR_LONG_2ADDR:
         case OP_ADD_DOUBLE_2ADDR:
         case OP_SUB_DOUBLE_2ADDR:
         case OP_MUL_DOUBLE_2ADDR:
         case OP_DIV_DOUBLE_2ADDR:
         case OP_REM_DOUBLE_2ADDR:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkWideRegisterIndex(meth, decInsn.vB);
             break;
         case OP_CONST_STRING:
         case OP_CONST_STRING_JUMBO:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkStringIndex(pDvmDex, decInsn.vB);
             break;
         case OP_CONST_CLASS:
         case OP_CHECK_CAST:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkTypeIndex(pDvmDex, decInsn.vB);
             break;
         case OP_INSTANCE_OF:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkTypeIndex(pDvmDex, decInsn.vC);
             break;
         case OP_NEW_INSTANCE:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkNewInstance(pDvmDex, decInsn.vB);
             break;
         case OP_NEW_ARRAY:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkNewArray(pDvmDex, decInsn.vC);
             break;
         case OP_FILL_ARRAY_DATA:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkArrayData(meth, codeOffset);
             break;
         case OP_PACKED_SWITCH:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkSwitchTargets(meth, insnFlags, codeOffset);
             break;
         case OP_SPARSE_SWITCH:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkSwitchTargets(meth, insnFlags, codeOffset);
             break;
         case OP_CMPL_FLOAT:
         case OP_CMPG_FLOAT:
         case OP_AGET:
         case OP_AGET_OBJECT:
         case OP_AGET_BOOLEAN:
         case OP_AGET_BYTE:
         case OP_AGET_CHAR:
         case OP_AGET_SHORT:
         case OP_APUT:
         case OP_APUT_OBJECT:
         case OP_APUT_BOOLEAN:
         case OP_APUT_BYTE:
         case OP_APUT_CHAR:
         case OP_APUT_SHORT:
         case OP_ADD_INT:
         case OP_SUB_INT:
         case OP_MUL_INT:
         case OP_DIV_INT:
         case OP_REM_INT:
         case OP_AND_INT:
         case OP_OR_INT:
         case OP_XOR_INT:
         case OP_SHL_INT:
         case OP_SHR_INT:
         case OP_USHR_INT:
         case OP_ADD_FLOAT:
         case OP_SUB_FLOAT:
         case OP_MUL_FLOAT:
         case OP_DIV_FLOAT:
         case OP_REM_FLOAT:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkRegisterIndex(meth, decInsn.vC);
             break;
         case OP_AGET_WIDE:
         case OP_APUT_WIDE:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkRegisterIndex(meth, decInsn.vC);
             break;
         case OP_CMPL_DOUBLE:
         case OP_CMPG_DOUBLE:
         case OP_CMP_LONG:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkWideRegisterIndex(meth, decInsn.vB);
             okay &= checkWideRegisterIndex(meth, decInsn.vC);
             break;
         case OP_ADD_DOUBLE:
         case OP_SUB_DOUBLE:
         case OP_MUL_DOUBLE:
         case OP_DIV_DOUBLE:
         case OP_REM_DOUBLE:
         case OP_ADD_LONG:
         case OP_SUB_LONG:
         case OP_MUL_LONG:
         case OP_DIV_LONG:
         case OP_REM_LONG:
         case OP_AND_LONG:
         case OP_OR_LONG:
         case OP_XOR_LONG:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkWideRegisterIndex(meth, decInsn.vB);
             okay &= checkWideRegisterIndex(meth, decInsn.vC);
             break;
         case OP_SHL_LONG:
         case OP_SHR_LONG:
         case OP_USHR_LONG:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkWideRegisterIndex(meth, decInsn.vB);
             okay &= checkRegisterIndex(meth, decInsn.vC);
             break;
         case OP_IF_EQ:
         case OP_IF_NE:
         case OP_IF_LT:
         case OP_IF_GE:
         case OP_IF_GT:
         case OP_IF_LE:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkBranchTarget(meth, insnFlags, codeOffset, false);
             break;
         case OP_IF_EQZ:
         case OP_IF_NEZ:
         case OP_IF_LTZ:
         case OP_IF_GEZ:
         case OP_IF_GTZ:
         case OP_IF_LEZ:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkBranchTarget(meth, insnFlags, codeOffset, false);
             break;
         case OP_IGET:
         case OP_IGET_OBJECT:
         case OP_IGET_BOOLEAN:
         case OP_IGET_BYTE:
         case OP_IGET_CHAR:
         case OP_IGET_SHORT:
         case OP_IPUT:
         case OP_IPUT_OBJECT:
         case OP_IPUT_BOOLEAN:
         case OP_IPUT_BYTE:
         case OP_IPUT_CHAR:
         case OP_IPUT_SHORT:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkFieldIndex(pDvmDex, decInsn.vC);
             break;
         case OP_IGET_WIDE:
         case OP_IPUT_WIDE:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkRegisterIndex(meth, decInsn.vB);
             okay &= checkFieldIndex(pDvmDex, decInsn.vC);
             break;
         case OP_SGET:
         case OP_SGET_OBJECT:
         case OP_SGET_BOOLEAN:
         case OP_SGET_BYTE:
         case OP_SGET_CHAR:
         case OP_SGET_SHORT:
         case OP_SPUT:
         case OP_SPUT_OBJECT:
         case OP_SPUT_BOOLEAN:
         case OP_SPUT_BYTE:
         case OP_SPUT_CHAR:
         case OP_SPUT_SHORT:
             okay &= checkRegisterIndex(meth, decInsn.vA);
             okay &= checkFieldIndex(pDvmDex, decInsn.vB);
             break;
         case OP_SGET_WIDE:
         case OP_SPUT_WIDE:
             okay &= checkWideRegisterIndex(meth, decInsn.vA);
             okay &= checkFieldIndex(pDvmDex, decInsn.vB);
             break;
         case OP_FILLED_NEW_ARRAY:
             /* decoder uses B, not C, for type ref */
             okay &= checkTypeIndex(pDvmDex, decInsn.vB);
             okay &= checkVarargRegs(meth, &decInsn);
             break;
         case OP_FILLED_NEW_ARRAY_RANGE:
             okay &= checkTypeIndex(pDvmDex, decInsn.vB);
             okay &= checkVarargRangeRegs(meth, &decInsn);
             break;
         case OP_INVOKE_VIRTUAL:
         case OP_INVOKE_SUPER:
         case OP_INVOKE_DIRECT:
         case OP_INVOKE_STATIC:
         case OP_INVOKE_INTERFACE:
             /* decoder uses B, not C, for type ref */
             okay &= checkMethodIndex(pDvmDex, decInsn.vB);
             okay &= checkVarargRegs(meth, &decInsn);
             break;
         case OP_INVOKE_VIRTUAL_RANGE:
         case OP_INVOKE_SUPER_RANGE:
         case OP_INVOKE_DIRECT_RANGE:
         case OP_INVOKE_STATIC_RANGE:
         case OP_INVOKE_INTERFACE_RANGE:
             okay &= checkMethodIndex(pDvmDex, decInsn.vB);
             okay &= checkVarargRangeRegs(meth, &decInsn);
             break;

         /* verifier/optimizer output; we should never see these */
         case OP_IGET_VOLATILE:
         case OP_IPUT_VOLATILE:
         case OP_SGET_VOLATILE:
         case OP_SPUT_VOLATILE:
         case OP_IGET_OBJECT_VOLATILE:
         case OP_IPUT_OBJECT_VOLATILE:
         case OP_SGET_OBJECT_VOLATILE:
         case OP_SPUT_OBJECT_VOLATILE:
         case OP_IGET_WIDE_VOLATILE:
         case OP_IPUT_WIDE_VOLATILE:
         case OP_SGET_WIDE_VOLATILE:
         case OP_SPUT_WIDE_VOLATILE:
         case OP_BREAKPOINT:
         case OP_THROW_VERIFICATION_ERROR:
         case OP_EXECUTE_INLINE:
         case OP_EXECUTE_INLINE_RANGE:
         case OP_INVOKE_DIRECT_EMPTY:
         case OP_RETURN_VOID_BARRIER:
         case OP_IGET_QUICK:
         case OP_IGET_WIDE_QUICK:
         case OP_IGET_OBJECT_QUICK:
         case OP_IPUT_QUICK:
         case OP_IPUT_WIDE_QUICK:
         case OP_IPUT_OBJECT_QUICK:
         case OP_INVOKE_VIRTUAL_QUICK:
         case OP_INVOKE_VIRTUAL_QUICK_RANGE:
         case OP_INVOKE_SUPER_QUICK:
         case OP_INVOKE_SUPER_QUICK_RANGE:
         case OP_UNUSED_3E:
         case OP_UNUSED_3F:
         case OP_UNUSED_40:
         case OP_UNUSED_41:
         case OP_UNUSED_42:
         case OP_UNUSED_43:
         case OP_UNUSED_73:
         case OP_UNUSED_79:
         case OP_UNUSED_7A:
         case OP_UNUSED_FF:
             LOGE("VFY: unexpected opcode %02x\n", decInsn.opCode);
             okay = false;
             break;

         /*
          * DO NOT add a "default" clause here.  Without it the compiler will
          * complain if an instruction is missing (which is desirable).
          */
         }

         if (!okay) {
             LOG_VFY_METH(meth, "VFY:  rejecting opcode 0x%02x at 0x%04x\n",
                 decInsn.opCode, codeOffset);
             return false;
         }

         /*
          * Certain types of instructions can be GC points.  To support precise
          * GC, all such instructions must export the PC in the interpreter,
          * or the GC won't be able to identify the current PC for the thread.
          */
         const int kGcMask = kInstrCanBranch | kInstrCanSwitch |
             kInstrCanThrow | kInstrCanReturn;

         InstructionFlags opFlags = dexGetInstrFlags(decInsn.opCode);
         if ((opFlags & kGcMask) != 0) {
             /*
              * This instruction is probably a GC point.  Branch instructions
              * only qualify if they go backward, so for those we need to
              * check the offset.
              */
             int offset;
             bool unused;
             if ((opFlags & kInstrCanBranch) != 0) {
                 /*
                  * Get the target.  This is slightly redundant, since the
                  * component was tagged with kVfyBranch, but it's easier
                  * to just grab it again than cart the state around.
                  */
                 if (!dvmGetBranchTarget(meth, insnFlags, codeOffset, &offset,
                         &unused))
                 {
                     /* should never happen */
                     LOGE("VFY: opcode %02x flagged as can branch, no target\n",
                         decInsn.opCode);
                     dvmAbort();
                 }
                 if (offset <= 0) {
                     /* backward branch, set GC flag */
                     dvmInsnSetGcPoint(insnFlags, codeOffset, true);
                 }
             } else {
                 /* not a branch instruction, always set GC flag */
                 dvmInsnSetGcPoint(insnFlags, codeOffset, true);
             }
         }

         assert(width > 0);
         codeOffset += width;
         insns += width;
     }

     /* make sure the last instruction ends at the end of the insn area */
     if (codeOffset != vdata->insnsSize) {
         LOG_VFY_METH(meth,
             "VFY: code did not end when expected (end at %d, count %d)\n",
             codeOffset, vdata->insnsSize);
         return false;
     }

     return true;
 }