/* * Copyright (c) 2007 The Hewlett-Packard Development Company * All rights reserved. * * Redistribution and use of this software in source and binary forms, * with or without modification, are permitted provided that the * following conditions are met: * * The software must be used only for Non-Commercial Use which means any * use which is NOT directed to receiving any direct monetary * compensation for, or commercial advantage from such use. Illustrative * examples of non-commercial use are academic research, personal study, * teaching, education and corporate research & development. * Illustrative examples of commercial use are distributing products for * commercial advantage and providing services using the software for * commercial advantage. * * If you wish to use this software or functionality therein that may be * covered by patents for commercial use, please contact: * Director of Intellectual Property Licensing * Office of Strategy and Technology * Hewlett-Packard Company * 1501 Page Mill Road * Palo Alto, California 94304 * * Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. Redistributions * in binary form must reproduce the above copyright notice, this list of * conditions and the following disclaimer in the documentation and/or * other materials provided with the distribution. Neither the name of * the COPYRIGHT HOLDER(s), HEWLETT-PACKARD COMPANY, nor the names of its * contributors may be used to endorse or promote products derived from * this software without specific prior written permission. No right of * sublicense is granted herewith. Derivatives of the software and * output created using the software may be prepared, but only for * Non-Commercial Uses. Derivatives of the software may be shared with * others provided: (i) the others agree to abide by the list of * conditions herein which includes the Non-Commercial Use restrictions; * and (ii) such Derivatives of the software include the above copyright * notice to acknowledge the contribution from this software where * applicable, this list of conditions and the disclaimer below. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * * Authors: Gabe Black */ #include "arch/x86/predecoder.hh" #include "base/misc.hh" #include "base/trace.hh" #include "sim/host.hh" namespace X86ISA { void Predecoder::doReset() { origPC = basePC + offset; DPRINTF(Predecoder, "Setting origPC to %#x\n", origPC); emi.rex = 0; emi.legacy = 0; emi.opcode.num = 0; emi.opcode.op = 0; emi.opcode.prefixA = emi.opcode.prefixB = 0; immediateCollected = 0; emi.immediate = 0; emi.displacement = 0; emi.modRM = 0; emi.sib = 0; emi.mode = 0; } void Predecoder::process() { //This function drives the predecoder state machine. //Some sanity checks. You shouldn't try to process more bytes if //there aren't any, and you shouldn't overwrite an already //predecoder ExtMachInst. assert(!outOfBytes); assert(!emiIsReady); //While there's still something to do... while(!emiIsReady && !outOfBytes) { uint8_t nextByte = getNextByte(); switch(state) { case ResetState: doReset(); state = PrefixState; case PrefixState: state = doPrefixState(nextByte); break; case OpcodeState: state = doOpcodeState(nextByte); break; case ModRMState: state = doModRMState(nextByte); break; case SIBState: state = doSIBState(nextByte); break; case DisplacementState: state = doDisplacementState(); break; case ImmediateState: state = doImmediateState(); break; case ErrorState: panic("Went to the error state in the predecoder.\n"); default: panic("Unrecognized state! %d\n", state); } } } //Either get a prefix and record it in the ExtMachInst, or send the //state machine on to get the opcode(s). Predecoder::State Predecoder::doPrefixState(uint8_t nextByte) { uint8_t prefix = Prefixes[nextByte]; State nextState = PrefixState; if(prefix) consumeByte(); switch(prefix) { //Operand size override prefixes case OperandSizeOverride: DPRINTF(Predecoder, "Found operand size override prefix.\n"); emi.legacy.op = true; break; case AddressSizeOverride: DPRINTF(Predecoder, "Found address size override prefix.\n"); emi.legacy.addr = true; break; //Segment override prefixes case CSOverride: case DSOverride: case ESOverride: case FSOverride: case GSOverride: case SSOverride: DPRINTF(Predecoder, "Found segment override.\n"); emi.legacy.seg = prefix; break; case Lock: DPRINTF(Predecoder, "Found lock prefix.\n"); emi.legacy.lock = true; break; case Rep: DPRINTF(Predecoder, "Found rep prefix.\n"); emi.legacy.rep = true; break; case Repne: DPRINTF(Predecoder, "Found repne prefix.\n"); emi.legacy.repne = true; break; case RexPrefix: DPRINTF(Predecoder, "Found Rex prefix %#x.\n", nextByte); emi.rex = nextByte; break; case 0: nextState = OpcodeState; break; default: panic("Unrecognized prefix %#x\n", nextByte); } return nextState; } //Load all the opcodes (currently up to 2) and then figure out //what immediate and/or ModRM is needed. Predecoder::State Predecoder::doOpcodeState(uint8_t nextByte) { State nextState = ErrorState; emi.opcode.num++; //We can't handle 3+ byte opcodes right now assert(emi.opcode.num < 3); consumeByte(); if(emi.opcode.num == 1 && nextByte == 0x0f) { nextState = OpcodeState; DPRINTF(Predecoder, "Found two byte opcode.\n"); emi.opcode.prefixA = nextByte; } else if(emi.opcode.num == 2 && (nextByte == 0x0f || (nextByte & 0xf8) == 0x38)) { panic("Three byte opcodes aren't yet supported!\n"); nextState = OpcodeState; DPRINTF(Predecoder, "Found three byte opcode.\n"); emi.opcode.prefixB = nextByte; } else { DPRINTF(Predecoder, "Found opcode %#x.\n", nextByte); emi.opcode.op = nextByte; //Figure out the effective operand size. This can be overriden to //a fixed value at the decoder level. int logOpSize; if(/*FIXME long mode*/1) { if(emi.rex.w) logOpSize = 3; // 64 bit operand size else if(emi.legacy.op) logOpSize = 1; // 16 bit operand size else logOpSize = 2; // 32 bit operand size } else if(/*FIXME default 32*/1) { if(emi.legacy.op) logOpSize = 1; // 16 bit operand size else logOpSize = 2; // 32 bit operand size } else // 16 bit default operand size { if(emi.legacy.op) logOpSize = 2; // 32 bit operand size else logOpSize = 1; // 16 bit operand size } //Set the actual op size emi.opSize = 1 << logOpSize; //Figure out the effective address size. This can be overriden to //a fixed value at the decoder level. int logAddrSize; if(/*FIXME 64-bit mode*/1) { if(emi.legacy.addr) logAddrSize = 2; // 32 bit address size else logAddrSize = 3; // 64 bit address size } else if(/*FIXME default 32*/1) { if(emi.legacy.addr) logAddrSize = 1; // 16 bit address size else logAddrSize = 2; // 32 bit address size } else // 16 bit default operand size { if(emi.legacy.addr) logAddrSize = 2; // 32 bit address size else logAddrSize = 1; // 16 bit address size } //Set the actual address size emi.addrSize = 1 << logAddrSize; //Figure out how big of an immediate we'll retreive based //on the opcode. int immType = ImmediateType[emi.opcode.num - 1][nextByte]; if (emi.opcode.num == 1 && nextByte >= 0xA0 && nextByte <= 0xA3) immediateSize = SizeTypeToSize[logAddrSize - 1][immType]; else immediateSize = SizeTypeToSize[logOpSize - 1][immType]; //Determine what to expect next if (UsesModRM[emi.opcode.num - 1][nextByte]) { nextState = ModRMState; } else { if(immediateSize) { nextState = ImmediateState; } else { emiIsReady = true; nextState = ResetState; } } } return nextState; } //Get the ModRM byte and determine what displacement, if any, there is. //Also determine whether or not to get the SIB byte, displacement, or //immediate next. Predecoder::State Predecoder::doModRMState(uint8_t nextByte) { State nextState = ErrorState; ModRM modRM; modRM = nextByte; DPRINTF(Predecoder, "Found modrm byte %#x.\n", nextByte); if (0) {//FIXME in 16 bit mode //figure out 16 bit displacement size if(modRM.mod == 0 && modRM.rm == 6 || modRM.mod == 2) displacementSize = 2; else if(modRM.mod == 1) displacementSize = 1; else displacementSize = 0; } else { //figure out 32/64 bit displacement size if(modRM.mod == 0 && modRM.rm == 5 || modRM.mod == 2) displacementSize = 4; else if(modRM.mod == 1) displacementSize = 1; else displacementSize = 0; } // The "test" instruction in group 3 needs an immediate, even though // the other instructions with the same actual opcode don't. if (emi.opcode.num == 1 && (modRM.reg & 0x6) == 0) { if (emi.opcode.op == 0xF6) immediateSize = 1; else if (emi.opcode.op == 0xF7) immediateSize = (emi.opSize == 8) ? 4 : emi.opSize; } //If there's an SIB, get that next. //There is no SIB in 16 bit mode. if (modRM.rm == 4 && modRM.mod != 3) { // && in 32/64 bit mode) nextState = SIBState; } else if(displacementSize) { nextState = DisplacementState; } else if(immediateSize) { nextState = ImmediateState; } else { emiIsReady = true; nextState = ResetState; } //The ModRM byte is consumed no matter what consumeByte(); emi.modRM = modRM; return nextState; } //Get the SIB byte. We don't do anything with it at this point, other //than storing it in the ExtMachInst. Determine if we need to get a //displacement or immediate next. Predecoder::State Predecoder::doSIBState(uint8_t nextByte) { State nextState = ErrorState; emi.sib = nextByte; DPRINTF(Predecoder, "Found SIB byte %#x.\n", nextByte); consumeByte(); if (emi.modRM.mod == 0 && emi.sib.base == 5) displacementSize = 4; if (displacementSize) { nextState = DisplacementState; } else if(immediateSize) { nextState = ImmediateState; } else { emiIsReady = true; nextState = ResetState; } return nextState; } //Gather up the displacement, or at least as much of it //as we can get. Predecoder::State Predecoder::doDisplacementState() { State nextState = ErrorState; getImmediate(immediateCollected, emi.displacement, displacementSize); DPRINTF(Predecoder, "Collecting %d byte displacement, got %d bytes.\n", displacementSize, immediateCollected); if(displacementSize == immediateCollected) { //Reset this for other immediates. immediateCollected = 0; //Sign extend the displacement switch(displacementSize) { case 1: emi.displacement = sext<8>(emi.displacement); break; case 2: emi.displacement = sext<16>(emi.displacement); break; case 4: emi.displacement = sext<32>(emi.displacement); break; default: panic("Undefined displacement size!\n"); } DPRINTF(Predecoder, "Collected displacement %#x.\n", emi.displacement); if(immediateSize) { nextState = ImmediateState; } else { emiIsReady = true; nextState = ResetState; } } else nextState = DisplacementState; return nextState; } //Gather up the immediate, or at least as much of it //as we can get Predecoder::State Predecoder::doImmediateState() { State nextState = ErrorState; getImmediate(immediateCollected, emi.immediate, immediateSize); DPRINTF(Predecoder, "Collecting %d byte immediate, got %d bytes.\n", immediateSize, immediateCollected); if(immediateSize == immediateCollected) { //Reset this for other immediates. immediateCollected = 0; //XXX Warning! The following is an observed pattern and might //not always be true! //Instructions which use 64 bit operands but 32 bit immediates //need to have the immediate sign extended to 64 bits. //Instructions which use true 64 bit immediates won't be //affected, and instructions that use true 32 bit immediates //won't notice. switch(immediateSize) { case 4: emi.immediate = sext<32>(emi.immediate); break; case 1: emi.immediate = sext<8>(emi.immediate); } DPRINTF(Predecoder, "Collected immediate %#x.\n", emi.immediate); emiIsReady = true; nextState = ResetState; } else nextState = ImmediateState; return nextState; } }