e3fb9afa79
Also change to ref counted DynInst. SConscript: Add branch predictor, BTB, load store queue, and storesets. arch/isa_parser.py: Specify the template parameter for AlphaDynInst base/traceflags.py: Add load store queue, store set, and mem dependence unit to the list of trace flags. cpu/base_dyn_inst.cc: Change formating, add in debug statement. cpu/base_dyn_inst.hh: Change DynInst to be RefCounted, add flag to clear whether or not this instruction can commit. This is likely to be removed in the future. cpu/beta_cpu/alpha_dyn_inst.cc: AlphaDynInst has been changed to be templated, so now this CC file is just used to force instantiations of AlphaDynInst. cpu/beta_cpu/alpha_dyn_inst.hh: Changed AlphaDynInst to be templated on Impl. Removed some unnecessary functions. cpu/beta_cpu/alpha_full_cpu.cc: AlphaFullCPU has been changed to be templated, so this CC file is now just used to force instantation of AlphaFullCPU. cpu/beta_cpu/alpha_full_cpu.hh: Change AlphaFullCPU to be templated on Impl. cpu/beta_cpu/alpha_impl.hh: Update it to reflect AlphaDynInst and AlphaFullCPU being templated on Impl. Also removed time buffers from here, as they are really a part of the CPU and are thus in the CPU policy now. cpu/beta_cpu/alpha_params.hh: Make AlphaSimpleParams inherit from the BaseFullCPU so that it doesn't need to specifically declare any parameters that are already in the BaseFullCPU. cpu/beta_cpu/comm.hh: Changed the structure of the time buffer communication structs. Now they include the size of the packet of instructions it is sending. Added some parameters to the backwards communication struct, mainly for squashing. cpu/beta_cpu/commit.hh: Update typenames to reflect change in location of time buffer structs. Update DynInst to DynInstPtr (it is refcounted now). cpu/beta_cpu/commit_impl.hh: Formatting changes mainly. Also sends back proper information on branch mispredicts so that the bpred unit can update itself. Updated behavior for non-speculative instructions (stores, any other non-spec instructions): once they reach the head of the ROB, the ROB signals back to the IQ that it can go ahead and issue the non-speculative instruction. The instruction itself is updated so that commit won't try to commit it again until it is done executing. cpu/beta_cpu/cpu_policy.hh: Added branch prediction unit, mem dependence prediction unit, load store queue. Moved time buffer structs from AlphaSimpleImpl to here. cpu/beta_cpu/decode.hh: Changed typedefs to reflect change in location of time buffer structs and also the change from DynInst to ref counted DynInstPtr. cpu/beta_cpu/decode_impl.hh: Continues to buffer instructions even while unblocking now. Changed how it loops through groups of instructions so it can properly block during the middle of a group of instructions. cpu/beta_cpu/fetch.hh: Changed typedefs to reflect change in location of time buffer structs and the change to ref counted DynInsts. Also added in branch brediction unit. cpu/beta_cpu/fetch_impl.hh: Add in branch prediction. Changed how fetch checks inputs and its current state to make for easier logic. cpu/beta_cpu/free_list.cc: Changed int regs and float regs to logically use one flat namespace. Future change will be moving them to a single scoreboard to conserve space. cpu/beta_cpu/free_list.hh: Mostly debugging statements. Might be removed for performance in future. cpu/beta_cpu/full_cpu.cc: Added in some debugging statements. Updated BaseFullCPU to take a params object. cpu/beta_cpu/full_cpu.hh: Added params class within BaseCPU that other param classes will be able to inherit from. Updated typedefs to reflect change in location of time buffer structs and ref counted DynInst. cpu/beta_cpu/iew.hh: Updated typedefs to reflect change in location of time buffer structs and use of ref counted DynInsts. cpu/beta_cpu/iew_impl.hh: Added in load store queue, updated iew to be able to execute non- speculative instructions, instead of having them execute in commit. cpu/beta_cpu/inst_queue.hh: Updated change to ref counted DynInsts. Changed inst queue to hold non-speculative instructions as well, which are issued only when commit signals backwards that a nonspeculative instruction is at the head of the ROB. cpu/beta_cpu/inst_queue_impl.hh: Updated to allow for non-speculative instructions to be in the inst queue. Also added some debug functions. cpu/beta_cpu/regfile.hh: Added debugging statements, changed formatting. cpu/beta_cpu/rename.hh: Updated typedefs, added some functions to clean up code. cpu/beta_cpu/rename_impl.hh: Moved some code into functions to make it easier to read. cpu/beta_cpu/rename_map.cc: Changed int and float reg behavior to use a single flat namespace. In the future, the rename maps can be combined to a single rename map to save space. cpu/beta_cpu/rename_map.hh: Added destructor. cpu/beta_cpu/rob.hh: Updated it with change from DynInst to ref counted DynInst. cpu/beta_cpu/rob_impl.hh: Formatting, updated to use ref counted DynInst. cpu/static_inst.hh: Updated forward declaration for AlphaDynInst now that it is templated. --HG-- extra : convert_revision : 1045f240ee9b6a4bd368e1806aca029ebbdc6dd3
690 lines
18 KiB
C++
690 lines
18 KiB
C++
|
|
#include "base/cprintf.hh"
|
|
#include "base/statistics.hh"
|
|
#include "base/timebuf.hh"
|
|
#include "mem/cache/cache.hh" // for dynamic cast
|
|
#include "mem/mem_interface.hh"
|
|
#include "sim/builder.hh"
|
|
#include "sim/sim_events.hh"
|
|
#include "sim/stats.hh"
|
|
|
|
#include "cpu/beta_cpu/alpha_full_cpu.hh"
|
|
#include "cpu/beta_cpu/alpha_params.hh"
|
|
#include "cpu/beta_cpu/comm.hh"
|
|
|
|
template <class Impl>
|
|
AlphaFullCPU<Impl>::AlphaFullCPU(Params ¶ms)
|
|
: FullBetaCPU<AlphaSimpleImpl>(params)
|
|
{
|
|
DPRINTF(FullCPU, "AlphaFullCPU: Creating AlphaFullCPU object.\n");
|
|
|
|
fetch.setCPU(this);
|
|
decode.setCPU(this);
|
|
rename.setCPU(this);
|
|
iew.setCPU(this);
|
|
commit.setCPU(this);
|
|
|
|
rob.setCPU(this);
|
|
}
|
|
|
|
#ifndef FULL_SYSTEM
|
|
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::syscall()
|
|
{
|
|
DPRINTF(FullCPU, "AlphaFullCPU: Syscall() called.\n\n");
|
|
|
|
// Commit stage needs to run as well.
|
|
commit.tick();
|
|
|
|
squashStages();
|
|
|
|
// Temporarily increase this by one to account for the syscall
|
|
// instruction.
|
|
++funcExeInst;
|
|
|
|
// Copy over all important state to xc once all the unrolling is done.
|
|
copyToXC();
|
|
|
|
process->syscall(xc);
|
|
|
|
// Copy over all important state back to CPU.
|
|
copyFromXC();
|
|
|
|
// Decrease funcExeInst by one as the normal commit will handle
|
|
// incrememnting it.
|
|
--funcExeInst;
|
|
}
|
|
|
|
// This is not a pretty function, and should only be used if it is necessary
|
|
// to fake having everything squash all at once (ie for non-full system
|
|
// syscalls). Maybe put this at the FullCPU level?
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::squashStages()
|
|
{
|
|
InstSeqNum rob_head = rob.readHeadSeqNum();
|
|
|
|
// Now hack the time buffer to put this sequence number in the places
|
|
// where the stages might read it.
|
|
for (int i = 0; i < 5; ++i)
|
|
{
|
|
timeBuffer.access(-i)->commitInfo.doneSeqNum = rob_head;
|
|
}
|
|
|
|
fetch.squash(rob.readHeadNextPC());
|
|
fetchQueue.advance();
|
|
|
|
decode.squash();
|
|
decodeQueue.advance();
|
|
|
|
rename.squash();
|
|
renameQueue.advance();
|
|
renameQueue.advance();
|
|
|
|
// Be sure to advance the IEW queues so that the commit stage doesn't
|
|
// try to set an instruction as completed at the same time that it
|
|
// might be deleting it.
|
|
iew.squash();
|
|
iewQueue.advance();
|
|
iewQueue.advance();
|
|
|
|
rob.squash(rob_head);
|
|
commit.setSquashing();
|
|
}
|
|
|
|
#endif // FULL_SYSTEM
|
|
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::copyToXC()
|
|
{
|
|
PhysRegIndex renamed_reg;
|
|
|
|
// First loop through the integer registers.
|
|
for (int i = 0; i < AlphaISA::NumIntRegs; ++i)
|
|
{
|
|
renamed_reg = renameMap.lookup(i);
|
|
xc->regs.intRegFile[i] = regFile.intRegFile[renamed_reg];
|
|
DPRINTF(FullCPU, "FullCPU: Copying register %i, has data %lli.\n",
|
|
renamed_reg, regFile.intRegFile[renamed_reg]);
|
|
}
|
|
|
|
// Then loop through the floating point registers.
|
|
for (int i = 0; i < AlphaISA::NumFloatRegs; ++i)
|
|
{
|
|
renamed_reg = renameMap.lookup(i + AlphaISA::FP_Base_DepTag);
|
|
xc->regs.floatRegFile.d[i] = regFile.floatRegFile[renamed_reg].d;
|
|
xc->regs.floatRegFile.q[i] = regFile.floatRegFile[renamed_reg].q;
|
|
}
|
|
|
|
xc->regs.miscRegs.fpcr = regFile.miscRegs.fpcr;
|
|
xc->regs.miscRegs.uniq = regFile.miscRegs.uniq;
|
|
xc->regs.miscRegs.lock_flag = regFile.miscRegs.lock_flag;
|
|
xc->regs.miscRegs.lock_addr = regFile.miscRegs.lock_addr;
|
|
|
|
xc->regs.pc = rob.readHeadPC();
|
|
xc->regs.npc = xc->regs.pc+4;
|
|
|
|
xc->func_exe_inst = funcExeInst;
|
|
}
|
|
|
|
// This function will probably mess things up unless the ROB is empty and
|
|
// there are no instructions in the pipeline.
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::copyFromXC()
|
|
{
|
|
PhysRegIndex renamed_reg;
|
|
|
|
// First loop through the integer registers.
|
|
for (int i = 0; i < AlphaISA::NumIntRegs; ++i)
|
|
{
|
|
renamed_reg = renameMap.lookup(i);
|
|
|
|
DPRINTF(FullCPU, "FullCPU: Copying over register %i, had data %lli, "
|
|
"now has data %lli.\n",
|
|
renamed_reg, regFile.intRegFile[renamed_reg],
|
|
xc->regs.intRegFile[i]);
|
|
|
|
regFile.intRegFile[renamed_reg] = xc->regs.intRegFile[i];
|
|
}
|
|
|
|
// Then loop through the floating point registers.
|
|
for (int i = 0; i < AlphaISA::NumFloatRegs; ++i)
|
|
{
|
|
renamed_reg = renameMap.lookup(i + AlphaISA::FP_Base_DepTag);
|
|
regFile.floatRegFile[renamed_reg].d = xc->regs.floatRegFile.d[i];
|
|
regFile.floatRegFile[renamed_reg].q = xc->regs.floatRegFile.q[i] ;
|
|
}
|
|
|
|
// Then loop through the misc registers.
|
|
regFile.miscRegs.fpcr = xc->regs.miscRegs.fpcr;
|
|
regFile.miscRegs.uniq = xc->regs.miscRegs.uniq;
|
|
regFile.miscRegs.lock_flag = xc->regs.miscRegs.lock_flag;
|
|
regFile.miscRegs.lock_addr = xc->regs.miscRegs.lock_addr;
|
|
|
|
// Then finally set the PC and the next PC.
|
|
// regFile.pc = xc->regs.pc;
|
|
// regFile.npc = xc->regs.npc;
|
|
|
|
funcExeInst = xc->func_exe_inst;
|
|
}
|
|
|
|
#ifdef FULL_SYSTEM
|
|
|
|
template <class Impl>
|
|
uint64_t *
|
|
AlphaFullCPU<Impl>::getIpr()
|
|
{
|
|
return regs.ipr;
|
|
}
|
|
|
|
template <class Impl>
|
|
uint64_t
|
|
AlphaFullCPU<Impl>::readIpr(int idx, Fault &fault)
|
|
{
|
|
uint64_t *ipr = getIpr();
|
|
uint64_t retval = 0; // return value, default 0
|
|
|
|
switch (idx) {
|
|
case AlphaISA::IPR_PALtemp0:
|
|
case AlphaISA::IPR_PALtemp1:
|
|
case AlphaISA::IPR_PALtemp2:
|
|
case AlphaISA::IPR_PALtemp3:
|
|
case AlphaISA::IPR_PALtemp4:
|
|
case AlphaISA::IPR_PALtemp5:
|
|
case AlphaISA::IPR_PALtemp6:
|
|
case AlphaISA::IPR_PALtemp7:
|
|
case AlphaISA::IPR_PALtemp8:
|
|
case AlphaISA::IPR_PALtemp9:
|
|
case AlphaISA::IPR_PALtemp10:
|
|
case AlphaISA::IPR_PALtemp11:
|
|
case AlphaISA::IPR_PALtemp12:
|
|
case AlphaISA::IPR_PALtemp13:
|
|
case AlphaISA::IPR_PALtemp14:
|
|
case AlphaISA::IPR_PALtemp15:
|
|
case AlphaISA::IPR_PALtemp16:
|
|
case AlphaISA::IPR_PALtemp17:
|
|
case AlphaISA::IPR_PALtemp18:
|
|
case AlphaISA::IPR_PALtemp19:
|
|
case AlphaISA::IPR_PALtemp20:
|
|
case AlphaISA::IPR_PALtemp21:
|
|
case AlphaISA::IPR_PALtemp22:
|
|
case AlphaISA::IPR_PALtemp23:
|
|
case AlphaISA::IPR_PAL_BASE:
|
|
|
|
case AlphaISA::IPR_IVPTBR:
|
|
case AlphaISA::IPR_DC_MODE:
|
|
case AlphaISA::IPR_MAF_MODE:
|
|
case AlphaISA::IPR_ISR:
|
|
case AlphaISA::IPR_EXC_ADDR:
|
|
case AlphaISA::IPR_IC_PERR_STAT:
|
|
case AlphaISA::IPR_DC_PERR_STAT:
|
|
case AlphaISA::IPR_MCSR:
|
|
case AlphaISA::IPR_ASTRR:
|
|
case AlphaISA::IPR_ASTER:
|
|
case AlphaISA::IPR_SIRR:
|
|
case AlphaISA::IPR_ICSR:
|
|
case AlphaISA::IPR_ICM:
|
|
case AlphaISA::IPR_DTB_CM:
|
|
case AlphaISA::IPR_IPLR:
|
|
case AlphaISA::IPR_INTID:
|
|
case AlphaISA::IPR_PMCTR:
|
|
// no side-effect
|
|
retval = ipr[idx];
|
|
break;
|
|
|
|
case AlphaISA::IPR_CC:
|
|
retval |= ipr[idx] & ULL(0xffffffff00000000);
|
|
retval |= curTick & ULL(0x00000000ffffffff);
|
|
break;
|
|
|
|
case AlphaISA::IPR_VA:
|
|
retval = ipr[idx];
|
|
break;
|
|
|
|
case AlphaISA::IPR_VA_FORM:
|
|
case AlphaISA::IPR_MM_STAT:
|
|
case AlphaISA::IPR_IFAULT_VA_FORM:
|
|
case AlphaISA::IPR_EXC_MASK:
|
|
case AlphaISA::IPR_EXC_SUM:
|
|
retval = ipr[idx];
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_PTE:
|
|
{
|
|
AlphaISA::PTE &pte = dtb->index(!misspeculating());
|
|
|
|
retval |= ((u_int64_t)pte.ppn & ULL(0x7ffffff)) << 32;
|
|
retval |= ((u_int64_t)pte.xre & ULL(0xf)) << 8;
|
|
retval |= ((u_int64_t)pte.xwe & ULL(0xf)) << 12;
|
|
retval |= ((u_int64_t)pte.fonr & ULL(0x1)) << 1;
|
|
retval |= ((u_int64_t)pte.fonw & ULL(0x1))<< 2;
|
|
retval |= ((u_int64_t)pte.asma & ULL(0x1)) << 4;
|
|
retval |= ((u_int64_t)pte.asn & ULL(0x7f)) << 57;
|
|
}
|
|
break;
|
|
|
|
// write only registers
|
|
case AlphaISA::IPR_HWINT_CLR:
|
|
case AlphaISA::IPR_SL_XMIT:
|
|
case AlphaISA::IPR_DC_FLUSH:
|
|
case AlphaISA::IPR_IC_FLUSH:
|
|
case AlphaISA::IPR_ALT_MODE:
|
|
case AlphaISA::IPR_DTB_IA:
|
|
case AlphaISA::IPR_DTB_IAP:
|
|
case AlphaISA::IPR_ITB_IA:
|
|
case AlphaISA::IPR_ITB_IAP:
|
|
fault = Unimplemented_Opcode_Fault;
|
|
break;
|
|
|
|
default:
|
|
// invalid IPR
|
|
fault = Unimplemented_Opcode_Fault;
|
|
break;
|
|
}
|
|
|
|
return retval;
|
|
}
|
|
|
|
template <class Impl>
|
|
Fault
|
|
AlphaFullCPU<Impl>::setIpr(int idx, uint64_t val)
|
|
{
|
|
uint64_t *ipr = getIpr();
|
|
uint64_t old;
|
|
|
|
if (misspeculating())
|
|
return No_Fault;
|
|
|
|
switch (idx) {
|
|
case AlphaISA::IPR_PALtemp0:
|
|
case AlphaISA::IPR_PALtemp1:
|
|
case AlphaISA::IPR_PALtemp2:
|
|
case AlphaISA::IPR_PALtemp3:
|
|
case AlphaISA::IPR_PALtemp4:
|
|
case AlphaISA::IPR_PALtemp5:
|
|
case AlphaISA::IPR_PALtemp6:
|
|
case AlphaISA::IPR_PALtemp7:
|
|
case AlphaISA::IPR_PALtemp8:
|
|
case AlphaISA::IPR_PALtemp9:
|
|
case AlphaISA::IPR_PALtemp10:
|
|
case AlphaISA::IPR_PALtemp11:
|
|
case AlphaISA::IPR_PALtemp12:
|
|
case AlphaISA::IPR_PALtemp13:
|
|
case AlphaISA::IPR_PALtemp14:
|
|
case AlphaISA::IPR_PALtemp15:
|
|
case AlphaISA::IPR_PALtemp16:
|
|
case AlphaISA::IPR_PALtemp17:
|
|
case AlphaISA::IPR_PALtemp18:
|
|
case AlphaISA::IPR_PALtemp19:
|
|
case AlphaISA::IPR_PALtemp20:
|
|
case AlphaISA::IPR_PALtemp21:
|
|
case AlphaISA::IPR_PALtemp22:
|
|
case AlphaISA::IPR_PAL_BASE:
|
|
case AlphaISA::IPR_IC_PERR_STAT:
|
|
case AlphaISA::IPR_DC_PERR_STAT:
|
|
case AlphaISA::IPR_PMCTR:
|
|
// write entire quad w/ no side-effect
|
|
ipr[idx] = val;
|
|
break;
|
|
|
|
case AlphaISA::IPR_CC_CTL:
|
|
// This IPR resets the cycle counter. We assume this only
|
|
// happens once... let's verify that.
|
|
assert(ipr[idx] == 0);
|
|
ipr[idx] = 1;
|
|
break;
|
|
|
|
case AlphaISA::IPR_CC:
|
|
// This IPR only writes the upper 64 bits. It's ok to write
|
|
// all 64 here since we mask out the lower 32 in rpcc (see
|
|
// isa_desc).
|
|
ipr[idx] = val;
|
|
break;
|
|
|
|
case AlphaISA::IPR_PALtemp23:
|
|
// write entire quad w/ no side-effect
|
|
old = ipr[idx];
|
|
ipr[idx] = val;
|
|
kernelStats.context(old, val);
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_PTE:
|
|
// write entire quad w/ no side-effect, tag is forthcoming
|
|
ipr[idx] = val;
|
|
break;
|
|
|
|
case AlphaISA::IPR_EXC_ADDR:
|
|
// second least significant bit in PC is always zero
|
|
ipr[idx] = val & ~2;
|
|
break;
|
|
|
|
case AlphaISA::IPR_ASTRR:
|
|
case AlphaISA::IPR_ASTER:
|
|
// only write least significant four bits - privilege mask
|
|
ipr[idx] = val & 0xf;
|
|
break;
|
|
|
|
case AlphaISA::IPR_IPLR:
|
|
#ifdef DEBUG
|
|
if (break_ipl != -1 && break_ipl == (val & 0x1f))
|
|
debug_break();
|
|
#endif
|
|
|
|
// only write least significant five bits - interrupt level
|
|
ipr[idx] = val & 0x1f;
|
|
kernelStats.swpipl(ipr[idx]);
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_CM:
|
|
kernelStats.mode((val & 0x18) != 0);
|
|
|
|
case AlphaISA::IPR_ICM:
|
|
// only write two mode bits - processor mode
|
|
ipr[idx] = val & 0x18;
|
|
break;
|
|
|
|
case AlphaISA::IPR_ALT_MODE:
|
|
// only write two mode bits - processor mode
|
|
ipr[idx] = val & 0x18;
|
|
break;
|
|
|
|
case AlphaISA::IPR_MCSR:
|
|
// more here after optimization...
|
|
ipr[idx] = val;
|
|
break;
|
|
|
|
case AlphaISA::IPR_SIRR:
|
|
// only write software interrupt mask
|
|
ipr[idx] = val & 0x7fff0;
|
|
break;
|
|
|
|
case AlphaISA::IPR_ICSR:
|
|
ipr[idx] = val & ULL(0xffffff0300);
|
|
break;
|
|
|
|
case AlphaISA::IPR_IVPTBR:
|
|
case AlphaISA::IPR_MVPTBR:
|
|
ipr[idx] = val & ULL(0xffffffffc0000000);
|
|
break;
|
|
|
|
case AlphaISA::IPR_DC_TEST_CTL:
|
|
ipr[idx] = val & 0x1ffb;
|
|
break;
|
|
|
|
case AlphaISA::IPR_DC_MODE:
|
|
case AlphaISA::IPR_MAF_MODE:
|
|
ipr[idx] = val & 0x3f;
|
|
break;
|
|
|
|
case AlphaISA::IPR_ITB_ASN:
|
|
ipr[idx] = val & 0x7f0;
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_ASN:
|
|
ipr[idx] = val & ULL(0xfe00000000000000);
|
|
break;
|
|
|
|
case AlphaISA::IPR_EXC_SUM:
|
|
case AlphaISA::IPR_EXC_MASK:
|
|
// any write to this register clears it
|
|
ipr[idx] = 0;
|
|
break;
|
|
|
|
case AlphaISA::IPR_INTID:
|
|
case AlphaISA::IPR_SL_RCV:
|
|
case AlphaISA::IPR_MM_STAT:
|
|
case AlphaISA::IPR_ITB_PTE_TEMP:
|
|
case AlphaISA::IPR_DTB_PTE_TEMP:
|
|
// read-only registers
|
|
return Unimplemented_Opcode_Fault;
|
|
|
|
case AlphaISA::IPR_HWINT_CLR:
|
|
case AlphaISA::IPR_SL_XMIT:
|
|
case AlphaISA::IPR_DC_FLUSH:
|
|
case AlphaISA::IPR_IC_FLUSH:
|
|
// the following are write only
|
|
ipr[idx] = val;
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_IA:
|
|
// really a control write
|
|
ipr[idx] = 0;
|
|
|
|
dtb->flushAll();
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_IAP:
|
|
// really a control write
|
|
ipr[idx] = 0;
|
|
|
|
dtb->flushProcesses();
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_IS:
|
|
// really a control write
|
|
ipr[idx] = val;
|
|
|
|
dtb->flushAddr(val, DTB_ASN_ASN(ipr[AlphaISA::IPR_DTB_ASN]));
|
|
break;
|
|
|
|
case AlphaISA::IPR_DTB_TAG: {
|
|
struct AlphaISA::PTE pte;
|
|
|
|
// FIXME: granularity hints NYI...
|
|
if (DTB_PTE_GH(ipr[AlphaISA::IPR_DTB_PTE]) != 0)
|
|
panic("PTE GH field != 0");
|
|
|
|
// write entire quad
|
|
ipr[idx] = val;
|
|
|
|
// construct PTE for new entry
|
|
pte.ppn = DTB_PTE_PPN(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.xre = DTB_PTE_XRE(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.xwe = DTB_PTE_XWE(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.fonr = DTB_PTE_FONR(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.fonw = DTB_PTE_FONW(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.asma = DTB_PTE_ASMA(ipr[AlphaISA::IPR_DTB_PTE]);
|
|
pte.asn = DTB_ASN_ASN(ipr[AlphaISA::IPR_DTB_ASN]);
|
|
|
|
// insert new TAG/PTE value into data TLB
|
|
dtb->insert(val, pte);
|
|
}
|
|
break;
|
|
|
|
case AlphaISA::IPR_ITB_PTE: {
|
|
struct AlphaISA::PTE pte;
|
|
|
|
// FIXME: granularity hints NYI...
|
|
if (ITB_PTE_GH(val) != 0)
|
|
panic("PTE GH field != 0");
|
|
|
|
// write entire quad
|
|
ipr[idx] = val;
|
|
|
|
// construct PTE for new entry
|
|
pte.ppn = ITB_PTE_PPN(val);
|
|
pte.xre = ITB_PTE_XRE(val);
|
|
pte.xwe = 0;
|
|
pte.fonr = ITB_PTE_FONR(val);
|
|
pte.fonw = ITB_PTE_FONW(val);
|
|
pte.asma = ITB_PTE_ASMA(val);
|
|
pte.asn = ITB_ASN_ASN(ipr[AlphaISA::IPR_ITB_ASN]);
|
|
|
|
// insert new TAG/PTE value into data TLB
|
|
itb->insert(ipr[AlphaISA::IPR_ITB_TAG], pte);
|
|
}
|
|
break;
|
|
|
|
case AlphaISA::IPR_ITB_IA:
|
|
// really a control write
|
|
ipr[idx] = 0;
|
|
|
|
itb->flushAll();
|
|
break;
|
|
|
|
case AlphaISA::IPR_ITB_IAP:
|
|
// really a control write
|
|
ipr[idx] = 0;
|
|
|
|
itb->flushProcesses();
|
|
break;
|
|
|
|
case AlphaISA::IPR_ITB_IS:
|
|
// really a control write
|
|
ipr[idx] = val;
|
|
|
|
itb->flushAddr(val, ITB_ASN_ASN(ipr[AlphaISA::IPR_ITB_ASN]));
|
|
break;
|
|
|
|
default:
|
|
// invalid IPR
|
|
return Unimplemented_Opcode_Fault;
|
|
}
|
|
|
|
// no error...
|
|
return No_Fault;
|
|
|
|
}
|
|
|
|
template <class Impl>
|
|
int
|
|
AlphaFullCPU<Impl>::readIntrFlag()
|
|
{
|
|
return regs.intrflag;
|
|
}
|
|
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::setIntrFlag(int val)
|
|
{
|
|
regs.intrflag = val;
|
|
}
|
|
|
|
// Maybe have this send back from IEW stage to squash and update PC.
|
|
template <class Impl>
|
|
Fault
|
|
AlphaFullCPU<Impl>::hwrei()
|
|
{
|
|
uint64_t *ipr = getIpr();
|
|
|
|
if (!PC_PAL(regs.pc))
|
|
return Unimplemented_Opcode_Fault;
|
|
|
|
setNextPC(ipr[AlphaISA::IPR_EXC_ADDR]);
|
|
|
|
if (!misspeculating()) {
|
|
kernelStats.hwrei();
|
|
|
|
if ((ipr[AlphaISA::IPR_EXC_ADDR] & 1) == 0)
|
|
AlphaISA::swap_palshadow(®s, false);
|
|
|
|
AlphaISA::check_interrupts = true;
|
|
}
|
|
|
|
// FIXME: XXX check for interrupts? XXX
|
|
return No_Fault;
|
|
}
|
|
|
|
template <class Impl>
|
|
bool
|
|
AlphaFullCPU<Impl>::inPalMode()
|
|
{
|
|
return PC_PAL(readPC());
|
|
}
|
|
|
|
template <class Impl>
|
|
bool
|
|
AlphaFullCPU<Impl>::simPalCheck(int palFunc)
|
|
{
|
|
kernelStats.callpal(palFunc);
|
|
|
|
switch (palFunc) {
|
|
case PAL::halt:
|
|
halt();
|
|
if (--System::numSystemsRunning == 0)
|
|
new SimExitEvent("all cpus halted");
|
|
break;
|
|
|
|
case PAL::bpt:
|
|
case PAL::bugchk:
|
|
if (system->breakpoint())
|
|
return false;
|
|
break;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
// Probably shouldn't be able to switch to the trap handler as quickly as
|
|
// this. Also needs to get the exception restart address from the commit
|
|
// stage.
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::trap(Fault fault)
|
|
{
|
|
uint64_t PC = commit.readPC();
|
|
|
|
DPRINTF(Fault, "Fault %s\n", FaultName(fault));
|
|
Stats::recordEvent(csprintf("Fault %s", FaultName(fault)));
|
|
|
|
assert(!misspeculating());
|
|
kernelStats.fault(fault);
|
|
|
|
if (fault == Arithmetic_Fault)
|
|
panic("Arithmetic traps are unimplemented!");
|
|
|
|
AlphaISA::InternalProcReg *ipr = getIpr();
|
|
|
|
// exception restart address - Get the commit PC
|
|
if (fault != Interrupt_Fault || !PC_PAL(PC))
|
|
ipr[AlphaISA::IPR_EXC_ADDR] = PC;
|
|
|
|
if (fault == Pal_Fault || fault == Arithmetic_Fault /* ||
|
|
fault == Interrupt_Fault && !PC_PAL(regs.pc) */) {
|
|
// traps... skip faulting instruction
|
|
ipr[AlphaISA::IPR_EXC_ADDR] += 4;
|
|
}
|
|
|
|
if (!PC_PAL(PC))
|
|
AlphaISA::swap_palshadow(®s, true);
|
|
|
|
setPC( ipr[AlphaISA::IPR_PAL_BASE] + AlphaISA::fault_addr[fault] );
|
|
setNextPC(PC + sizeof(MachInst));
|
|
}
|
|
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::processInterrupts()
|
|
{
|
|
// Check for interrupts here. For now can copy the code that exists
|
|
// within isa_fullsys_traits.hh.
|
|
}
|
|
|
|
// swap_palshadow swaps in the values of the shadow registers and
|
|
// swaps them with the values of the physical registers that map to the
|
|
// same logical index.
|
|
template <class Impl>
|
|
void
|
|
AlphaFullCPU<Impl>::swap_palshadow(RegFile *regs, bool use_shadow)
|
|
{
|
|
if (palShadowEnabled == use_shadow)
|
|
panic("swap_palshadow: wrong PAL shadow state");
|
|
|
|
palShadowEnabled = use_shadow;
|
|
|
|
// Will have to lookup in rename map to get physical registers, then
|
|
// swap.
|
|
for (int i = 0; i < AlphaISA::NumIntRegs; i++) {
|
|
if (reg_redir[i]) {
|
|
AlphaISA::IntReg temp = regs->intRegFile[i];
|
|
regs->intRegFile[i] = regs->palregs[i];
|
|
regs->palregs[i] = temp;
|
|
}
|
|
}
|
|
}
|
|
|
|
#endif // FULL_SYSTEM
|