Merge zizzer.eecs.umich.edu:/bk/newmem
into doughnut.mwconnections.com:/home/gblack/newmem-o3-micro --HG-- extra : convert_revision : 545b9e98eb1895f4b9e782224fb6615c71ed6323
This commit is contained in:
commit
4ad1b58fdd
34 changed files with 482 additions and 481 deletions
|
@ -57,10 +57,12 @@ let {{
|
||||||
addrCalcImm = 'EA = Rs1 + imm;'
|
addrCalcImm = 'EA = Rs1 + imm;'
|
||||||
iop = InstObjParams(name, Name, 'Mem',
|
iop = InstObjParams(name, Name, 'Mem',
|
||||||
{"code": code, "postacc_code" : postacc_code,
|
{"code": code, "postacc_code" : postacc_code,
|
||||||
"fault_check": faultCode, "ea_code": addrCalcReg}, opt_flags)
|
"fault_check": faultCode, "ea_code": addrCalcReg,
|
||||||
|
"EA_trunc": TruncateEA}, opt_flags)
|
||||||
iop_imm = InstObjParams(name, Name + "Imm", 'MemImm',
|
iop_imm = InstObjParams(name, Name + "Imm", 'MemImm',
|
||||||
{"code": code, "postacc_code" : postacc_code,
|
{"code": code, "postacc_code" : postacc_code,
|
||||||
"fault_check": faultCode, "ea_code": addrCalcImm}, opt_flags)
|
"fault_check": faultCode, "ea_code": addrCalcImm,
|
||||||
|
"EA_trunc": TruncateEA}, opt_flags)
|
||||||
header_output = MemDeclare.subst(iop) + MemDeclare.subst(iop_imm)
|
header_output = MemDeclare.subst(iop) + MemDeclare.subst(iop_imm)
|
||||||
decoder_output = BasicConstructor.subst(iop) + BasicConstructor.subst(iop_imm)
|
decoder_output = BasicConstructor.subst(iop) + BasicConstructor.subst(iop_imm)
|
||||||
decode_block = ROrImmDecode.subst(iop)
|
decode_block = ROrImmDecode.subst(iop)
|
||||||
|
|
|
@ -298,11 +298,13 @@ let {{
|
||||||
iop = InstObjParams(name, Name, 'BlockMem',
|
iop = InstObjParams(name, Name, 'BlockMem',
|
||||||
{"code": pcedCode, "ea_code": addrCalcReg,
|
{"code": pcedCode, "ea_code": addrCalcReg,
|
||||||
"fault_check": faultCode, "micro_pc": microPc,
|
"fault_check": faultCode, "micro_pc": microPc,
|
||||||
"set_flags": flag_code}, opt_flags)
|
"set_flags": flag_code, "EA_trunc" : TruncateEA},
|
||||||
|
opt_flags)
|
||||||
iop_imm = InstObjParams(name, Name + 'Imm', 'BlockMemImm',
|
iop_imm = InstObjParams(name, Name + 'Imm', 'BlockMemImm',
|
||||||
{"code": pcedCode, "ea_code": addrCalcImm,
|
{"code": pcedCode, "ea_code": addrCalcImm,
|
||||||
"fault_check": faultCode, "micro_pc": microPc,
|
"fault_check": faultCode, "micro_pc": microPc,
|
||||||
"set_flags": flag_code}, opt_flags)
|
"set_flags": flag_code, "EA_trunc" : TruncateEA},
|
||||||
|
opt_flags)
|
||||||
decoder_output += BlockMemMicroConstructor.subst(iop)
|
decoder_output += BlockMemMicroConstructor.subst(iop)
|
||||||
decoder_output += BlockMemMicroConstructor.subst(iop_imm)
|
decoder_output += BlockMemMicroConstructor.subst(iop_imm)
|
||||||
exec_output += doDualSplitExecute(
|
exec_output += doDualSplitExecute(
|
||||||
|
|
|
@ -51,6 +51,7 @@ def template SwapExecute {{
|
||||||
}
|
}
|
||||||
if(storeCond && fault == NoFault)
|
if(storeCond && fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
|
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
|
||||||
EA, %(asi_val)s, &mem_data);
|
EA, %(asi_val)s, &mem_data);
|
||||||
}
|
}
|
||||||
|
@ -91,6 +92,7 @@ def template SwapInitiateAcc {{
|
||||||
}
|
}
|
||||||
if(fault == NoFault)
|
if(fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
|
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
|
||||||
EA, %(asi_val)s, &mem_data);
|
EA, %(asi_val)s, &mem_data);
|
||||||
}
|
}
|
||||||
|
@ -157,12 +159,14 @@ let {{
|
||||||
addrCalcReg = 'EA = Rs1;'
|
addrCalcReg = 'EA = Rs1;'
|
||||||
iop = InstObjParams(name, Name, 'Mem',
|
iop = InstObjParams(name, Name, 'Mem',
|
||||||
{"code": code, "postacc_code" : postacc_code,
|
{"code": code, "postacc_code" : postacc_code,
|
||||||
"fault_check": faultCode, "ea_code": addrCalcReg}, opt_flags)
|
"fault_check": faultCode, "ea_code": addrCalcReg,
|
||||||
|
"EA_trunc" : TruncateEA}, opt_flags)
|
||||||
header_output = MemDeclare.subst(iop)
|
header_output = MemDeclare.subst(iop)
|
||||||
decoder_output = BasicConstructor.subst(iop)
|
decoder_output = BasicConstructor.subst(iop)
|
||||||
decode_block = BasicDecode.subst(iop)
|
decode_block = BasicDecode.subst(iop)
|
||||||
microParams = {"code": code, "postacc_code" : postacc_code,
|
microParams = {"code": code, "postacc_code" : postacc_code,
|
||||||
"ea_code" : addrCalcReg, "fault_check" : faultCode}
|
"ea_code" : addrCalcReg, "fault_check" : faultCode,
|
||||||
|
"EA_trunc" : TruncateEA}
|
||||||
exec_output = doSplitExecute(execute, name, Name, asi,
|
exec_output = doSplitExecute(execute, name, Name, asi,
|
||||||
["IsStoreConditional"], microParams);
|
["IsStoreConditional"], microParams);
|
||||||
return (header_output, decoder_output, exec_output, decode_block)
|
return (header_output, decoder_output, exec_output, decode_block)
|
||||||
|
|
|
@ -149,6 +149,7 @@ def template LoadExecute {{
|
||||||
%(fault_check)s;
|
%(fault_check)s;
|
||||||
if(fault == NoFault)
|
if(fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
|
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
|
||||||
}
|
}
|
||||||
if(fault == NoFault)
|
if(fault == NoFault)
|
||||||
|
@ -179,6 +180,7 @@ def template LoadInitiateAcc {{
|
||||||
%(fault_check)s;
|
%(fault_check)s;
|
||||||
if(fault == NoFault)
|
if(fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
|
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
|
||||||
}
|
}
|
||||||
return fault;
|
return fault;
|
||||||
|
@ -224,6 +226,7 @@ def template StoreExecute {{
|
||||||
}
|
}
|
||||||
if(storeCond && fault == NoFault)
|
if(storeCond && fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
|
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
|
||||||
EA, %(asi_val)s, 0);
|
EA, %(asi_val)s, 0);
|
||||||
}
|
}
|
||||||
|
@ -257,6 +260,7 @@ def template StoreInitiateAcc {{
|
||||||
}
|
}
|
||||||
if(storeCond && fault == NoFault)
|
if(storeCond && fault == NoFault)
|
||||||
{
|
{
|
||||||
|
%(EA_trunc)s
|
||||||
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
|
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
|
||||||
EA, %(asi_val)s, 0);
|
EA, %(asi_val)s, 0);
|
||||||
}
|
}
|
||||||
|
@ -317,6 +321,11 @@ let {{
|
||||||
fault = new PrivilegedAction;
|
fault = new PrivilegedAction;
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
TruncateEA = '''
|
||||||
|
#if !FULL_SYSTEM
|
||||||
|
EA = Pstate<3:> ? EA<31:0> : EA;
|
||||||
|
#endif
|
||||||
|
'''
|
||||||
}};
|
}};
|
||||||
|
|
||||||
//A simple function to generate the name of the macro op of a certain
|
//A simple function to generate the name of the macro op of a certain
|
||||||
|
@ -346,7 +355,8 @@ let {{
|
||||||
(eaRegCode, nameReg, NameReg),
|
(eaRegCode, nameReg, NameReg),
|
||||||
(eaImmCode, nameImm, NameImm)):
|
(eaImmCode, nameImm, NameImm)):
|
||||||
microParams = {"code": code, "postacc_code" : postacc_code,
|
microParams = {"code": code, "postacc_code" : postacc_code,
|
||||||
"ea_code": eaCode, "fault_check": faultCode}
|
"ea_code": eaCode, "fault_check": faultCode,
|
||||||
|
"EA_trunc" : TruncateEA}
|
||||||
executeCode += doSplitExecute(execute, name, Name,
|
executeCode += doSplitExecute(execute, name, Name,
|
||||||
asi, opt_flags, microParams)
|
asi, opt_flags, microParams)
|
||||||
return executeCode
|
return executeCode
|
||||||
|
|
|
@ -149,7 +149,8 @@ def operands {{
|
||||||
'Fprs': ('ControlReg', 'udw', 'MISCREG_FPRS', None, 43),
|
'Fprs': ('ControlReg', 'udw', 'MISCREG_FPRS', None, 43),
|
||||||
'Pcr': ('ControlReg', 'udw', 'MISCREG_PCR', None, 44),
|
'Pcr': ('ControlReg', 'udw', 'MISCREG_PCR', None, 44),
|
||||||
'Pic': ('ControlReg', 'udw', 'MISCREG_PIC', None, 45),
|
'Pic': ('ControlReg', 'udw', 'MISCREG_PIC', None, 45),
|
||||||
'Gsr': ('ControlReg', 'udw', 'MISCREG_GSR', None, 46),
|
# 'Gsr': ('ControlReg', 'udw', 'MISCREG_GSR', (None, None, ['IsSerializeAfter','IsSerializing','IsNonSpeculative']), 46),
|
||||||
|
'Gsr': ('IntReg', 'udw', 'NumIntArchRegs + 8', None, 46),
|
||||||
'Softint': ('ControlReg', 'udw', 'MISCREG_SOFTINT', None, 47),
|
'Softint': ('ControlReg', 'udw', 'MISCREG_SOFTINT', None, 47),
|
||||||
'SoftintSet': ('ControlReg', 'udw', 'MISCREG_SOFTINT_SET', None, 48),
|
'SoftintSet': ('ControlReg', 'udw', 'MISCREG_SOFTINT_SET', None, 48),
|
||||||
'SoftintClr': ('ControlReg', 'udw', 'MISCREG_SOFTINT_CLR', None, 49),
|
'SoftintClr': ('ControlReg', 'udw', 'MISCREG_SOFTINT_CLR', None, 49),
|
||||||
|
@ -187,7 +188,7 @@ def operands {{
|
||||||
'Hver': ('ControlReg', 'udw', 'MISCREG_HVER', None, 74),
|
'Hver': ('ControlReg', 'udw', 'MISCREG_HVER', None, 74),
|
||||||
'StrandStsReg': ('ControlReg', 'udw', 'MISCREG_STRAND_STS_REG', None, 75),
|
'StrandStsReg': ('ControlReg', 'udw', 'MISCREG_STRAND_STS_REG', None, 75),
|
||||||
|
|
||||||
'Fsr': ('ControlReg', 'udw', 'MISCREG_FSR', None, 80),
|
'Fsr': ('ControlReg', 'udw', 'MISCREG_FSR', (None, None, ['IsSerializeAfter','IsSerializing','IsNonSpeculative']), 80),
|
||||||
# Mem gets a large number so it's always last
|
# Mem gets a large number so it's always last
|
||||||
'Mem': ('Mem', 'udw', None, ('IsMemRef', 'IsLoad', 'IsStore'), 100)
|
'Mem': ('Mem', 'udw', None, ('IsMemRef', 'IsLoad', 'IsStore'), 100)
|
||||||
|
|
||||||
|
|
|
@ -58,7 +58,7 @@ namespace SparcISA
|
||||||
|
|
||||||
// These enumerate all the registers for dependence tracking.
|
// These enumerate all the registers for dependence tracking.
|
||||||
enum DependenceTags {
|
enum DependenceTags {
|
||||||
FP_Base_DepTag = 32*3+8,
|
FP_Base_DepTag = 32*3+9,
|
||||||
Ctrl_Base_DepTag = FP_Base_DepTag + 64
|
Ctrl_Base_DepTag = FP_Base_DepTag + 64
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
|
@ -87,8 +87,8 @@ Sparc32LiveProcess::startup()
|
||||||
|
|
||||||
//From the SPARC ABI
|
//From the SPARC ABI
|
||||||
|
|
||||||
//The process runs in user mode
|
//The process runs in user mode with 32 bit addresses
|
||||||
threadContexts[0]->setMiscReg(MISCREG_PSTATE, 0x02);
|
threadContexts[0]->setMiscReg(MISCREG_PSTATE, 0x0a);
|
||||||
|
|
||||||
//Setup default FP state
|
//Setup default FP state
|
||||||
threadContexts[0]->setMiscRegNoEffect(MISCREG_FSR, 0);
|
threadContexts[0]->setMiscRegNoEffect(MISCREG_FSR, 0);
|
||||||
|
|
|
@ -42,7 +42,7 @@ namespace SparcISA
|
||||||
// Number of register windows, can legally be 3 to 32
|
// Number of register windows, can legally be 3 to 32
|
||||||
const int NWindows = 8;
|
const int NWindows = 8;
|
||||||
//const int NumMicroIntRegs = 1;
|
//const int NumMicroIntRegs = 1;
|
||||||
const int NumMicroIntRegs = 8;
|
const int NumMicroIntRegs = 9;
|
||||||
|
|
||||||
// const int NumRegularIntRegs = MaxGL * 8 + NWindows * 16;
|
// const int NumRegularIntRegs = MaxGL * 8 + NWindows * 16;
|
||||||
// const int NumMicroIntRegs = 1;
|
// const int NumMicroIntRegs = 1;
|
||||||
|
|
|
@ -59,7 +59,7 @@ namespace SparcISA
|
||||||
|
|
||||||
typedef int RegContextVal;
|
typedef int RegContextVal;
|
||||||
|
|
||||||
typedef uint8_t RegIndex;
|
typedef uint16_t RegIndex;
|
||||||
}
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -209,6 +209,9 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
/** PC of this instruction. */
|
/** PC of this instruction. */
|
||||||
Addr PC;
|
Addr PC;
|
||||||
|
|
||||||
|
/** Micro PC of this instruction. */
|
||||||
|
Addr microPC;
|
||||||
|
|
||||||
protected:
|
protected:
|
||||||
/** Next non-speculative PC. It is not filled in at fetch, but rather
|
/** Next non-speculative PC. It is not filled in at fetch, but rather
|
||||||
* once the target of the branch is truly known (either decode or
|
* once the target of the branch is truly known (either decode or
|
||||||
|
@ -219,12 +222,18 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
/** Next non-speculative NPC. Target PC for Mips or Sparc. */
|
/** Next non-speculative NPC. Target PC for Mips or Sparc. */
|
||||||
Addr nextNPC;
|
Addr nextNPC;
|
||||||
|
|
||||||
|
/** Next non-speculative micro PC. */
|
||||||
|
Addr nextMicroPC;
|
||||||
|
|
||||||
/** Predicted next PC. */
|
/** Predicted next PC. */
|
||||||
Addr predPC;
|
Addr predPC;
|
||||||
|
|
||||||
/** Predicted next NPC. */
|
/** Predicted next NPC. */
|
||||||
Addr predNPC;
|
Addr predNPC;
|
||||||
|
|
||||||
|
/** Predicted next microPC */
|
||||||
|
Addr predMicroPC;
|
||||||
|
|
||||||
/** If this is a branch that was predicted taken */
|
/** If this is a branch that was predicted taken */
|
||||||
bool predTaken;
|
bool predTaken;
|
||||||
|
|
||||||
|
@ -340,6 +349,17 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
{
|
{
|
||||||
_flatDestRegIdx[idx] = flattened_dest;
|
_flatDestRegIdx[idx] = flattened_dest;
|
||||||
}
|
}
|
||||||
|
/** BaseDynInst constructor given a binary instruction.
|
||||||
|
* @param staticInst A StaticInstPtr to the underlying instruction.
|
||||||
|
* @param PC The PC of the instruction.
|
||||||
|
* @param pred_PC The predicted next PC.
|
||||||
|
* @param pred_NPC The predicted next NPC.
|
||||||
|
* @param seq_num The sequence number of the instruction.
|
||||||
|
* @param cpu Pointer to the instruction's CPU.
|
||||||
|
*/
|
||||||
|
BaseDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr pred_PC, Addr pred_NPC, Addr pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, ImplCPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a binary instruction.
|
/** BaseDynInst constructor given a binary instruction.
|
||||||
* @param inst The binary instruction.
|
* @param inst The binary instruction.
|
||||||
|
@ -349,8 +369,8 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
* @param seq_num The sequence number of the instruction.
|
* @param seq_num The sequence number of the instruction.
|
||||||
* @param cpu Pointer to the instruction's CPU.
|
* @param cpu Pointer to the instruction's CPU.
|
||||||
*/
|
*/
|
||||||
BaseDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC,
|
BaseDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr pred_PC, Addr pred_NPC,
|
Addr pred_PC, Addr pred_NPC, Addr pred_MicroPC,
|
||||||
InstSeqNum seq_num, ImplCPU *cpu);
|
InstSeqNum seq_num, ImplCPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a StaticInst pointer.
|
/** BaseDynInst constructor given a StaticInst pointer.
|
||||||
|
@ -402,11 +422,18 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Addr readNextMicroPC()
|
||||||
|
{
|
||||||
|
return nextMicroPC;
|
||||||
|
}
|
||||||
|
|
||||||
/** Set the predicted target of this current instruction. */
|
/** Set the predicted target of this current instruction. */
|
||||||
void setPredTarg(Addr predicted_PC, Addr predicted_NPC)
|
void setPredTarg(Addr predicted_PC, Addr predicted_NPC,
|
||||||
|
Addr predicted_MicroPC)
|
||||||
{
|
{
|
||||||
predPC = predicted_PC;
|
predPC = predicted_PC;
|
||||||
predNPC = predicted_NPC;
|
predNPC = predicted_NPC;
|
||||||
|
predMicroPC = predicted_MicroPC;
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Returns the predicted PC immediately after the branch. */
|
/** Returns the predicted PC immediately after the branch. */
|
||||||
|
@ -415,6 +442,9 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
/** Returns the predicted PC two instructions after the branch */
|
/** Returns the predicted PC two instructions after the branch */
|
||||||
Addr readPredNPC() { return predNPC; }
|
Addr readPredNPC() { return predNPC; }
|
||||||
|
|
||||||
|
/** Returns the predicted micro PC after the branch */
|
||||||
|
Addr readPredMicroPC() { return predMicroPC; }
|
||||||
|
|
||||||
/** Returns whether the instruction was predicted taken or not. */
|
/** Returns whether the instruction was predicted taken or not. */
|
||||||
bool readPredTaken()
|
bool readPredTaken()
|
||||||
{
|
{
|
||||||
|
@ -430,7 +460,8 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
bool mispredicted()
|
bool mispredicted()
|
||||||
{
|
{
|
||||||
return readPredPC() != readNextPC() ||
|
return readPredPC() != readNextPC() ||
|
||||||
readPredNPC() != readNextNPC();
|
readPredNPC() != readNextNPC() ||
|
||||||
|
readPredMicroPC() != readNextMicroPC();
|
||||||
}
|
}
|
||||||
|
|
||||||
//
|
//
|
||||||
|
@ -467,6 +498,12 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
bool isQuiesce() const { return staticInst->isQuiesce(); }
|
bool isQuiesce() const { return staticInst->isQuiesce(); }
|
||||||
bool isIprAccess() const { return staticInst->isIprAccess(); }
|
bool isIprAccess() const { return staticInst->isIprAccess(); }
|
||||||
bool isUnverifiable() const { return staticInst->isUnverifiable(); }
|
bool isUnverifiable() const { return staticInst->isUnverifiable(); }
|
||||||
|
bool isMacroOp() const { return staticInst->isMacroOp(); }
|
||||||
|
bool isMicroOp() const { return staticInst->isMicroOp(); }
|
||||||
|
bool isDelayedCommit() const { return staticInst->isDelayedCommit(); }
|
||||||
|
bool isLastMicroOp() const { return staticInst->isLastMicroOp(); }
|
||||||
|
bool isFirstMicroOp() const { return staticInst->isFirstMicroOp(); }
|
||||||
|
bool isMicroBranch() const { return staticInst->isMicroBranch(); }
|
||||||
|
|
||||||
/** Temporarily sets this instruction as a serialize before instruction. */
|
/** Temporarily sets this instruction as a serialize before instruction. */
|
||||||
void setSerializeBefore() { status.set(SerializeBefore); }
|
void setSerializeBefore() { status.set(SerializeBefore); }
|
||||||
|
@ -700,16 +737,26 @@ class BaseDynInst : public FastAlloc, public RefCounted
|
||||||
/** Read the PC of this instruction. */
|
/** Read the PC of this instruction. */
|
||||||
const Addr readPC() const { return PC; }
|
const Addr readPC() const { return PC; }
|
||||||
|
|
||||||
|
/**Read the micro PC of this instruction. */
|
||||||
|
const Addr readMicroPC() const { return microPC; }
|
||||||
|
|
||||||
/** Set the next PC of this instruction (its actual target). */
|
/** Set the next PC of this instruction (its actual target). */
|
||||||
void setNextPC(uint64_t val)
|
void setNextPC(Addr val)
|
||||||
{
|
{
|
||||||
nextPC = val;
|
nextPC = val;
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Set the next NPC of this instruction (the target in Mips or Sparc).*/
|
/** Set the next NPC of this instruction (the target in Mips or Sparc).*/
|
||||||
void setNextNPC(uint64_t val)
|
void setNextNPC(Addr val)
|
||||||
{
|
{
|
||||||
|
#if ISA_HAS_DELAY_SLOT
|
||||||
nextNPC = val;
|
nextNPC = val;
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
|
void setNextMicroPC(Addr val)
|
||||||
|
{
|
||||||
|
nextMicroPC = val;
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Sets the ASID. */
|
/** Sets the ASID. */
|
||||||
|
|
|
@ -62,19 +62,66 @@ my_hash_t thishash;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
BaseDynInst<Impl>::BaseDynInst(TheISA::ExtMachInst machInst,
|
BaseDynInst<Impl>::BaseDynInst(StaticInstPtr _staticInst,
|
||||||
Addr inst_PC, Addr inst_NPC,
|
Addr inst_PC, Addr inst_NPC,
|
||||||
|
Addr inst_MicroPC,
|
||||||
Addr pred_PC, Addr pred_NPC,
|
Addr pred_PC, Addr pred_NPC,
|
||||||
|
Addr pred_MicroPC,
|
||||||
InstSeqNum seq_num, ImplCPU *cpu)
|
InstSeqNum seq_num, ImplCPU *cpu)
|
||||||
: staticInst(machInst), traceData(NULL), cpu(cpu)
|
: staticInst(_staticInst), traceData(NULL), cpu(cpu)
|
||||||
{
|
{
|
||||||
seqNum = seq_num;
|
seqNum = seq_num;
|
||||||
|
|
||||||
|
bool nextIsMicro =
|
||||||
|
staticInst->isMicroOp() && !staticInst->isLastMicroOp();
|
||||||
|
|
||||||
PC = inst_PC;
|
PC = inst_PC;
|
||||||
|
microPC = inst_MicroPC;
|
||||||
|
if (nextIsMicro) {
|
||||||
|
nextPC = inst_PC;
|
||||||
|
nextNPC = inst_NPC;
|
||||||
|
nextMicroPC = microPC + 1;
|
||||||
|
} else {
|
||||||
nextPC = inst_NPC;
|
nextPC = inst_NPC;
|
||||||
nextNPC = nextPC + sizeof(TheISA::MachInst);
|
nextNPC = nextPC + sizeof(TheISA::MachInst);
|
||||||
|
nextMicroPC = 0;
|
||||||
|
}
|
||||||
predPC = pred_PC;
|
predPC = pred_PC;
|
||||||
predNPC = pred_NPC;
|
predNPC = pred_NPC;
|
||||||
|
predMicroPC = pred_MicroPC;
|
||||||
|
predTaken = false;
|
||||||
|
|
||||||
|
initVars();
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
BaseDynInst<Impl>::BaseDynInst(TheISA::ExtMachInst inst,
|
||||||
|
Addr inst_PC, Addr inst_NPC,
|
||||||
|
Addr inst_MicroPC,
|
||||||
|
Addr pred_PC, Addr pred_NPC,
|
||||||
|
Addr pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, ImplCPU *cpu)
|
||||||
|
: staticInst(inst), traceData(NULL), cpu(cpu)
|
||||||
|
{
|
||||||
|
seqNum = seq_num;
|
||||||
|
|
||||||
|
bool nextIsMicro =
|
||||||
|
staticInst->isMicroOp() && !staticInst->isLastMicroOp();
|
||||||
|
|
||||||
|
PC = inst_PC;
|
||||||
|
microPC = inst_MicroPC;
|
||||||
|
if (nextIsMicro) {
|
||||||
|
nextPC = inst_PC;
|
||||||
|
nextNPC = inst_NPC;
|
||||||
|
nextMicroPC = microPC + 1;
|
||||||
|
} else {
|
||||||
|
nextPC = inst_NPC;
|
||||||
|
nextNPC = nextPC + sizeof(TheISA::MachInst);
|
||||||
|
nextMicroPC = 0;
|
||||||
|
}
|
||||||
|
predPC = pred_PC;
|
||||||
|
predNPC = pred_NPC;
|
||||||
|
predMicroPC = pred_MicroPC;
|
||||||
predTaken = false;
|
predTaken = false;
|
||||||
|
|
||||||
initVars();
|
initVars();
|
||||||
|
|
|
@ -73,8 +73,13 @@ class AlphaDynInst : public BaseDynInst<Impl>
|
||||||
|
|
||||||
public:
|
public:
|
||||||
/** BaseDynInst constructor given a binary instruction. */
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC,
|
AlphaDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr Pred_PC, Addr Pred_NPC,
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
|
AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
InstSeqNum seq_num, O3CPU *cpu);
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a static inst pointer. */
|
/** BaseDynInst constructor given a static inst pointer. */
|
||||||
|
|
|
@ -31,10 +31,25 @@
|
||||||
#include "cpu/o3/alpha/dyn_inst.hh"
|
#include "cpu/o3/alpha/dyn_inst.hh"
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
AlphaDynInst<Impl>::AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC,
|
AlphaDynInst<Impl>::AlphaDynInst(StaticInstPtr staticInst,
|
||||||
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr Pred_PC, Addr Pred_NPC,
|
Addr Pred_PC, Addr Pred_NPC,
|
||||||
|
Addr Pred_MicroPC,
|
||||||
InstSeqNum seq_num, O3CPU *cpu)
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
|
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
|
{
|
||||||
|
initVars();
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
AlphaDynInst<Impl>::AlphaDynInst(ExtMachInst inst,
|
||||||
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC,
|
||||||
|
Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
|
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
{
|
{
|
||||||
initVars();
|
initVars();
|
||||||
}
|
}
|
||||||
|
|
|
@ -87,10 +87,10 @@ struct DefaultIEWDefaultCommit {
|
||||||
bool squash[Impl::MaxThreads];
|
bool squash[Impl::MaxThreads];
|
||||||
bool branchMispredict[Impl::MaxThreads];
|
bool branchMispredict[Impl::MaxThreads];
|
||||||
bool branchTaken[Impl::MaxThreads];
|
bool branchTaken[Impl::MaxThreads];
|
||||||
bool squashDelaySlot[Impl::MaxThreads];
|
Addr mispredPC[Impl::MaxThreads];
|
||||||
uint64_t mispredPC[Impl::MaxThreads];
|
Addr nextPC[Impl::MaxThreads];
|
||||||
uint64_t nextPC[Impl::MaxThreads];
|
Addr nextNPC[Impl::MaxThreads];
|
||||||
uint64_t nextNPC[Impl::MaxThreads];
|
Addr nextMicroPC[Impl::MaxThreads];
|
||||||
InstSeqNum squashedSeqNum[Impl::MaxThreads];
|
InstSeqNum squashedSeqNum[Impl::MaxThreads];
|
||||||
|
|
||||||
bool includeSquashInst[Impl::MaxThreads];
|
bool includeSquashInst[Impl::MaxThreads];
|
||||||
|
@ -114,15 +114,15 @@ struct TimeBufStruct {
|
||||||
uint64_t branchAddr;
|
uint64_t branchAddr;
|
||||||
|
|
||||||
InstSeqNum doneSeqNum;
|
InstSeqNum doneSeqNum;
|
||||||
InstSeqNum bdelayDoneSeqNum;
|
|
||||||
|
|
||||||
// @todo: Might want to package this kind of branch stuff into a single
|
// @todo: Might want to package this kind of branch stuff into a single
|
||||||
// struct as it is used pretty frequently.
|
// struct as it is used pretty frequently.
|
||||||
bool branchMispredict;
|
bool branchMispredict;
|
||||||
bool branchTaken;
|
bool branchTaken;
|
||||||
uint64_t mispredPC;
|
Addr mispredPC;
|
||||||
uint64_t nextPC;
|
Addr nextPC;
|
||||||
uint64_t nextNPC;
|
Addr nextNPC;
|
||||||
|
Addr nextMicroPC;
|
||||||
|
|
||||||
unsigned branchCount;
|
unsigned branchCount;
|
||||||
};
|
};
|
||||||
|
@ -160,18 +160,16 @@ struct TimeBufStruct {
|
||||||
|
|
||||||
bool branchMispredict;
|
bool branchMispredict;
|
||||||
bool branchTaken;
|
bool branchTaken;
|
||||||
uint64_t mispredPC;
|
Addr mispredPC;
|
||||||
uint64_t nextPC;
|
Addr nextPC;
|
||||||
uint64_t nextNPC;
|
Addr nextNPC;
|
||||||
|
Addr nextMicroPC;
|
||||||
|
|
||||||
// Represents the instruction that has either been retired or
|
// Represents the instruction that has either been retired or
|
||||||
// squashed. Similar to having a single bus that broadcasts the
|
// squashed. Similar to having a single bus that broadcasts the
|
||||||
// retired or squashed sequence number.
|
// retired or squashed sequence number.
|
||||||
InstSeqNum doneSeqNum;
|
InstSeqNum doneSeqNum;
|
||||||
|
|
||||||
InstSeqNum bdelayDoneSeqNum;
|
|
||||||
bool squashDelaySlot;
|
|
||||||
|
|
||||||
//Just in case we want to do a commit/squash on a cycle
|
//Just in case we want to do a commit/squash on a cycle
|
||||||
//(necessary for multiple ROBs?)
|
//(necessary for multiple ROBs?)
|
||||||
bool commitInsts;
|
bool commitInsts;
|
||||||
|
|
|
@ -279,25 +279,37 @@ class DefaultCommit
|
||||||
/** Returns the PC of the head instruction of the ROB.
|
/** Returns the PC of the head instruction of the ROB.
|
||||||
* @todo: Probably remove this function as it returns only thread 0.
|
* @todo: Probably remove this function as it returns only thread 0.
|
||||||
*/
|
*/
|
||||||
uint64_t readPC() { return PC[0]; }
|
Addr readPC() { return PC[0]; }
|
||||||
|
|
||||||
/** Returns the PC of a specific thread. */
|
/** Returns the PC of a specific thread. */
|
||||||
uint64_t readPC(unsigned tid) { return PC[tid]; }
|
Addr readPC(unsigned tid) { return PC[tid]; }
|
||||||
|
|
||||||
/** Sets the PC of a specific thread. */
|
/** Sets the PC of a specific thread. */
|
||||||
void setPC(uint64_t val, unsigned tid) { PC[tid] = val; }
|
void setPC(Addr val, unsigned tid) { PC[tid] = val; }
|
||||||
|
|
||||||
|
/** Reads the micro PC of a specific thread. */
|
||||||
|
Addr readMicroPC(unsigned tid) { return microPC[tid]; }
|
||||||
|
|
||||||
|
/** Sets the micro PC of a specific thread */
|
||||||
|
void setMicroPC(Addr val, unsigned tid) { microPC[tid] = val; }
|
||||||
|
|
||||||
/** Reads the next PC of a specific thread. */
|
/** Reads the next PC of a specific thread. */
|
||||||
uint64_t readNextPC(unsigned tid) { return nextPC[tid]; }
|
Addr readNextPC(unsigned tid) { return nextPC[tid]; }
|
||||||
|
|
||||||
/** Sets the next PC of a specific thread. */
|
/** Sets the next PC of a specific thread. */
|
||||||
void setNextPC(uint64_t val, unsigned tid) { nextPC[tid] = val; }
|
void setNextPC(Addr val, unsigned tid) { nextPC[tid] = val; }
|
||||||
|
|
||||||
/** Reads the next NPC of a specific thread. */
|
/** Reads the next NPC of a specific thread. */
|
||||||
uint64_t readNextNPC(unsigned tid) { return nextNPC[tid]; }
|
Addr readNextNPC(unsigned tid) { return nextNPC[tid]; }
|
||||||
|
|
||||||
/** Sets the next NPC of a specific thread. */
|
/** Sets the next NPC of a specific thread. */
|
||||||
void setNextNPC(uint64_t val, unsigned tid) { nextNPC[tid] = val; }
|
void setNextNPC(Addr val, unsigned tid) { nextNPC[tid] = val; }
|
||||||
|
|
||||||
|
/** Reads the micro PC of a specific thread. */
|
||||||
|
Addr readNextMicroPC(unsigned tid) { return nextMicroPC[tid]; }
|
||||||
|
|
||||||
|
/** Sets the micro PC of a specific thread */
|
||||||
|
void setNextMicroPC(Addr val, unsigned tid) { nextMicroPC[tid] = val; }
|
||||||
|
|
||||||
private:
|
private:
|
||||||
/** Time buffer interface. */
|
/** Time buffer interface. */
|
||||||
|
@ -402,12 +414,20 @@ class DefaultCommit
|
||||||
*/
|
*/
|
||||||
Addr PC[Impl::MaxThreads];
|
Addr PC[Impl::MaxThreads];
|
||||||
|
|
||||||
|
/** The commit micro PC of each thread. Refers to the instruction that
|
||||||
|
* is currently being processed/committed.
|
||||||
|
*/
|
||||||
|
Addr microPC[Impl::MaxThreads];
|
||||||
|
|
||||||
/** The next PC of each thread. */
|
/** The next PC of each thread. */
|
||||||
Addr nextPC[Impl::MaxThreads];
|
Addr nextPC[Impl::MaxThreads];
|
||||||
|
|
||||||
/** The next NPC of each thread. */
|
/** The next NPC of each thread. */
|
||||||
Addr nextNPC[Impl::MaxThreads];
|
Addr nextNPC[Impl::MaxThreads];
|
||||||
|
|
||||||
|
/** The next micro PC of each thread. */
|
||||||
|
Addr nextMicroPC[Impl::MaxThreads];
|
||||||
|
|
||||||
/** The sequence number of the youngest valid instruction in the ROB. */
|
/** The sequence number of the youngest valid instruction in the ROB. */
|
||||||
InstSeqNum youngestSeqNum[Impl::MaxThreads];
|
InstSeqNum youngestSeqNum[Impl::MaxThreads];
|
||||||
|
|
||||||
|
|
|
@ -124,7 +124,7 @@ DefaultCommit<Impl>::DefaultCommit(O3CPU *_cpu, Params *params)
|
||||||
committedStores[i] = false;
|
committedStores[i] = false;
|
||||||
trapSquash[i] = false;
|
trapSquash[i] = false;
|
||||||
tcSquash[i] = false;
|
tcSquash[i] = false;
|
||||||
PC[i] = nextPC[i] = nextNPC[i] = 0;
|
microPC[i] = nextMicroPC[i] = PC[i] = nextPC[i] = nextNPC[i] = 0;
|
||||||
}
|
}
|
||||||
#if FULL_SYSTEM
|
#if FULL_SYSTEM
|
||||||
interrupt = NoFault;
|
interrupt = NoFault;
|
||||||
|
@ -508,6 +508,7 @@ DefaultCommit<Impl>::squashAll(unsigned tid)
|
||||||
|
|
||||||
toIEW->commitInfo[tid].nextPC = PC[tid];
|
toIEW->commitInfo[tid].nextPC = PC[tid];
|
||||||
toIEW->commitInfo[tid].nextNPC = nextPC[tid];
|
toIEW->commitInfo[tid].nextNPC = nextPC[tid];
|
||||||
|
toIEW->commitInfo[tid].nextMicroPC = nextMicroPC[tid];
|
||||||
}
|
}
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
|
@ -738,38 +739,15 @@ DefaultCommit<Impl>::commit()
|
||||||
// then use one older sequence number.
|
// then use one older sequence number.
|
||||||
InstSeqNum squashed_inst = fromIEW->squashedSeqNum[tid];
|
InstSeqNum squashed_inst = fromIEW->squashedSeqNum[tid];
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
InstSeqNum bdelay_done_seq_num = squashed_inst;
|
|
||||||
bool squash_bdelay_slot = fromIEW->squashDelaySlot[tid];
|
|
||||||
bool branchMispredict = fromIEW->branchMispredict[tid];
|
|
||||||
|
|
||||||
// Squashing/not squashing the branch delay slot only makes
|
|
||||||
// sense when you're squashing from a branch, ie from a branch
|
|
||||||
// mispredict.
|
|
||||||
if (branchMispredict && !squash_bdelay_slot) {
|
|
||||||
bdelay_done_seq_num++;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
if (fromIEW->includeSquashInst[tid] == true) {
|
if (fromIEW->includeSquashInst[tid] == true) {
|
||||||
squashed_inst--;
|
squashed_inst--;
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
bdelay_done_seq_num--;
|
|
||||||
#endif
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// All younger instructions will be squashed. Set the sequence
|
// All younger instructions will be squashed. Set the sequence
|
||||||
// number as the youngest instruction in the ROB.
|
// number as the youngest instruction in the ROB.
|
||||||
youngestSeqNum[tid] = squashed_inst;
|
youngestSeqNum[tid] = squashed_inst;
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
rob->squash(bdelay_done_seq_num, tid);
|
|
||||||
toIEW->commitInfo[tid].squashDelaySlot = squash_bdelay_slot;
|
|
||||||
toIEW->commitInfo[tid].bdelayDoneSeqNum = bdelay_done_seq_num;
|
|
||||||
#else
|
|
||||||
rob->squash(squashed_inst, tid);
|
rob->squash(squashed_inst, tid);
|
||||||
toIEW->commitInfo[tid].squashDelaySlot = true;
|
|
||||||
#endif
|
|
||||||
changedROBNumEntries[tid] = true;
|
changedROBNumEntries[tid] = true;
|
||||||
|
|
||||||
toIEW->commitInfo[tid].doneSeqNum = squashed_inst;
|
toIEW->commitInfo[tid].doneSeqNum = squashed_inst;
|
||||||
|
@ -788,6 +766,7 @@ DefaultCommit<Impl>::commit()
|
||||||
|
|
||||||
toIEW->commitInfo[tid].nextPC = fromIEW->nextPC[tid];
|
toIEW->commitInfo[tid].nextPC = fromIEW->nextPC[tid];
|
||||||
toIEW->commitInfo[tid].nextNPC = fromIEW->nextNPC[tid];
|
toIEW->commitInfo[tid].nextNPC = fromIEW->nextNPC[tid];
|
||||||
|
toIEW->commitInfo[tid].nextMicroPC = fromIEW->nextMicroPC[tid];
|
||||||
|
|
||||||
toIEW->commitInfo[tid].mispredPC = fromIEW->mispredPC[tid];
|
toIEW->commitInfo[tid].mispredPC = fromIEW->mispredPC[tid];
|
||||||
|
|
||||||
|
@ -806,10 +785,6 @@ DefaultCommit<Impl>::commit()
|
||||||
|
|
||||||
// Try to commit any instructions.
|
// Try to commit any instructions.
|
||||||
commitInsts();
|
commitInsts();
|
||||||
} else {
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
skidInsert();
|
|
||||||
#endif
|
|
||||||
}
|
}
|
||||||
|
|
||||||
//Check for any activity
|
//Check for any activity
|
||||||
|
@ -901,6 +876,7 @@ DefaultCommit<Impl>::commitInsts()
|
||||||
PC[tid] = head_inst->readPC();
|
PC[tid] = head_inst->readPC();
|
||||||
nextPC[tid] = head_inst->readNextPC();
|
nextPC[tid] = head_inst->readNextPC();
|
||||||
nextNPC[tid] = head_inst->readNextNPC();
|
nextNPC[tid] = head_inst->readNextNPC();
|
||||||
|
nextMicroPC[tid] = head_inst->readNextMicroPC();
|
||||||
|
|
||||||
// Increment the total number of non-speculative instructions
|
// Increment the total number of non-speculative instructions
|
||||||
// executed.
|
// executed.
|
||||||
|
@ -929,12 +905,10 @@ DefaultCommit<Impl>::commitInsts()
|
||||||
}
|
}
|
||||||
|
|
||||||
PC[tid] = nextPC[tid];
|
PC[tid] = nextPC[tid];
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
nextPC[tid] = nextNPC[tid];
|
nextPC[tid] = nextNPC[tid];
|
||||||
nextNPC[tid] = nextNPC[tid] + sizeof(TheISA::MachInst);
|
nextNPC[tid] = nextNPC[tid] + sizeof(TheISA::MachInst);
|
||||||
#else
|
microPC[tid] = nextMicroPC[tid];
|
||||||
nextPC[tid] = nextPC[tid] + sizeof(TheISA::MachInst);
|
nextMicroPC[tid] = microPC[tid] + 1;
|
||||||
#endif
|
|
||||||
|
|
||||||
#if FULL_SYSTEM
|
#if FULL_SYSTEM
|
||||||
int count = 0;
|
int count = 0;
|
||||||
|
@ -1161,37 +1135,13 @@ DefaultCommit<Impl>::getInsts()
|
||||||
{
|
{
|
||||||
DPRINTF(Commit, "Getting instructions from Rename stage.\n");
|
DPRINTF(Commit, "Getting instructions from Rename stage.\n");
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
// Read any renamed instructions and place them into the ROB.
|
|
||||||
int insts_to_process = std::min((int)renameWidth,
|
|
||||||
(int)(fromRename->size + skidBuffer.size()));
|
|
||||||
int rename_idx = 0;
|
|
||||||
|
|
||||||
DPRINTF(Commit, "%i insts available to process. Rename Insts:%i "
|
|
||||||
"SkidBuffer Insts:%i\n", insts_to_process, fromRename->size,
|
|
||||||
skidBuffer.size());
|
|
||||||
#else
|
|
||||||
// Read any renamed instructions and place them into the ROB.
|
// Read any renamed instructions and place them into the ROB.
|
||||||
int insts_to_process = std::min((int)renameWidth, fromRename->size);
|
int insts_to_process = std::min((int)renameWidth, fromRename->size);
|
||||||
#endif
|
|
||||||
|
|
||||||
|
|
||||||
for (int inst_num = 0; inst_num < insts_to_process; ++inst_num) {
|
for (int inst_num = 0; inst_num < insts_to_process; ++inst_num) {
|
||||||
DynInstPtr inst;
|
DynInstPtr inst;
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
// Get insts from skidBuffer or from Rename
|
|
||||||
if (skidBuffer.size() > 0) {
|
|
||||||
DPRINTF(Commit, "Grabbing skidbuffer inst.\n");
|
|
||||||
inst = skidBuffer.front();
|
|
||||||
skidBuffer.pop();
|
|
||||||
} else {
|
|
||||||
DPRINTF(Commit, "Grabbing rename inst.\n");
|
|
||||||
inst = fromRename->insts[rename_idx++];
|
|
||||||
}
|
|
||||||
#else
|
|
||||||
inst = fromRename->insts[inst_num];
|
inst = fromRename->insts[inst_num];
|
||||||
#endif
|
|
||||||
int tid = inst->threadNumber;
|
int tid = inst->threadNumber;
|
||||||
|
|
||||||
if (!inst->isSquashed() &&
|
if (!inst->isSquashed() &&
|
||||||
|
@ -1213,30 +1163,6 @@ DefaultCommit<Impl>::getInsts()
|
||||||
inst->readPC(), inst->seqNum, tid);
|
inst->readPC(), inst->seqNum, tid);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if (rename_idx < fromRename->size) {
|
|
||||||
DPRINTF(Commit,"Placing Rename Insts into skidBuffer.\n");
|
|
||||||
|
|
||||||
for (;
|
|
||||||
rename_idx < fromRename->size;
|
|
||||||
rename_idx++) {
|
|
||||||
DynInstPtr inst = fromRename->insts[rename_idx];
|
|
||||||
|
|
||||||
if (!inst->isSquashed()) {
|
|
||||||
DPRINTF(Commit, "Inserting PC %#x [sn:%i] [tid:%i] into ",
|
|
||||||
"skidBuffer.\n", inst->readPC(), inst->seqNum,
|
|
||||||
inst->threadNumber);
|
|
||||||
skidBuffer.push(inst);
|
|
||||||
} else {
|
|
||||||
DPRINTF(Commit, "Instruction PC %#x [sn:%i] [tid:%i] was "
|
|
||||||
"squashed, skipping.\n",
|
|
||||||
inst->readPC(), inst->seqNum, inst->threadNumber);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
|
|
|
@ -696,7 +696,7 @@ FullO3CPU<Impl>::removeThread(unsigned tid)
|
||||||
|
|
||||||
// Squash Throughout Pipeline
|
// Squash Throughout Pipeline
|
||||||
InstSeqNum squash_seq_num = commit.rob->readHeadInst(tid)->seqNum;
|
InstSeqNum squash_seq_num = commit.rob->readHeadInst(tid)->seqNum;
|
||||||
fetch.squash(0, sizeof(TheISA::MachInst), squash_seq_num, true, tid);
|
fetch.squash(0, sizeof(TheISA::MachInst), 0, squash_seq_num, tid);
|
||||||
decode.squash(tid);
|
decode.squash(tid);
|
||||||
rename.squash(squash_seq_num, tid);
|
rename.squash(squash_seq_num, tid);
|
||||||
iew.squash(tid);
|
iew.squash(tid);
|
||||||
|
@ -1150,6 +1150,20 @@ FullO3CPU<Impl>::setPC(Addr new_PC,unsigned tid)
|
||||||
commit.setPC(new_PC, tid);
|
commit.setPC(new_PC, tid);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
uint64_t
|
||||||
|
FullO3CPU<Impl>::readMicroPC(unsigned tid)
|
||||||
|
{
|
||||||
|
return commit.readMicroPC(tid);
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
void
|
||||||
|
FullO3CPU<Impl>::setMicroPC(Addr new_PC,unsigned tid)
|
||||||
|
{
|
||||||
|
commit.setMicroPC(new_PC, tid);
|
||||||
|
}
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
uint64_t
|
uint64_t
|
||||||
FullO3CPU<Impl>::readNextPC(unsigned tid)
|
FullO3CPU<Impl>::readNextPC(unsigned tid)
|
||||||
|
@ -1178,6 +1192,20 @@ FullO3CPU<Impl>::setNextNPC(uint64_t val,unsigned tid)
|
||||||
commit.setNextNPC(val, tid);
|
commit.setNextNPC(val, tid);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
uint64_t
|
||||||
|
FullO3CPU<Impl>::readNextMicroPC(unsigned tid)
|
||||||
|
{
|
||||||
|
return commit.readNextMicroPC(tid);
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
void
|
||||||
|
FullO3CPU<Impl>::setNextMicroPC(Addr new_PC,unsigned tid)
|
||||||
|
{
|
||||||
|
commit.setNextMicroPC(new_PC, tid);
|
||||||
|
}
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
typename FullO3CPU<Impl>::ListIt
|
typename FullO3CPU<Impl>::ListIt
|
||||||
FullO3CPU<Impl>::addInst(DynInstPtr &inst)
|
FullO3CPU<Impl>::addInst(DynInstPtr &inst)
|
||||||
|
@ -1226,9 +1254,7 @@ FullO3CPU<Impl>::removeFrontInst(DynInstPtr &inst)
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
void
|
void
|
||||||
FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid,
|
FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid)
|
||||||
bool squash_delay_slot,
|
|
||||||
const InstSeqNum &delay_slot_seq_num)
|
|
||||||
{
|
{
|
||||||
DPRINTF(O3CPU, "Thread %i: Deleting instructions from instruction"
|
DPRINTF(O3CPU, "Thread %i: Deleting instructions from instruction"
|
||||||
" list.\n", tid);
|
" list.\n", tid);
|
||||||
|
@ -1259,12 +1285,6 @@ FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid,
|
||||||
while (inst_it != end_it) {
|
while (inst_it != end_it) {
|
||||||
assert(!instList.empty());
|
assert(!instList.empty());
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if(!squash_delay_slot &&
|
|
||||||
delay_slot_seq_num >= (*inst_it)->seqNum) {
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
squashInstIt(inst_it, tid);
|
squashInstIt(inst_it, tid);
|
||||||
|
|
||||||
inst_it--;
|
inst_it--;
|
||||||
|
|
|
@ -433,22 +433,34 @@ class FullO3CPU : public BaseO3CPU
|
||||||
void setArchFloatRegInt(int reg_idx, uint64_t val, unsigned tid);
|
void setArchFloatRegInt(int reg_idx, uint64_t val, unsigned tid);
|
||||||
|
|
||||||
/** Reads the commit PC of a specific thread. */
|
/** Reads the commit PC of a specific thread. */
|
||||||
uint64_t readPC(unsigned tid);
|
Addr readPC(unsigned tid);
|
||||||
|
|
||||||
/** Sets the commit PC of a specific thread. */
|
/** Sets the commit PC of a specific thread. */
|
||||||
void setPC(Addr new_PC, unsigned tid);
|
void setPC(Addr new_PC, unsigned tid);
|
||||||
|
|
||||||
|
/** Reads the commit micro PC of a specific thread. */
|
||||||
|
Addr readMicroPC(unsigned tid);
|
||||||
|
|
||||||
|
/** Sets the commmit micro PC of a specific thread. */
|
||||||
|
void setMicroPC(Addr new_microPC, unsigned tid);
|
||||||
|
|
||||||
/** Reads the next PC of a specific thread. */
|
/** Reads the next PC of a specific thread. */
|
||||||
uint64_t readNextPC(unsigned tid);
|
Addr readNextPC(unsigned tid);
|
||||||
|
|
||||||
/** Sets the next PC of a specific thread. */
|
/** Sets the next PC of a specific thread. */
|
||||||
void setNextPC(uint64_t val, unsigned tid);
|
void setNextPC(Addr val, unsigned tid);
|
||||||
|
|
||||||
/** Reads the next NPC of a specific thread. */
|
/** Reads the next NPC of a specific thread. */
|
||||||
uint64_t readNextNPC(unsigned tid);
|
Addr readNextNPC(unsigned tid);
|
||||||
|
|
||||||
/** Sets the next NPC of a specific thread. */
|
/** Sets the next NPC of a specific thread. */
|
||||||
void setNextNPC(uint64_t val, unsigned tid);
|
void setNextNPC(Addr val, unsigned tid);
|
||||||
|
|
||||||
|
/** Reads the commit next micro PC of a specific thread. */
|
||||||
|
Addr readNextMicroPC(unsigned tid);
|
||||||
|
|
||||||
|
/** Sets the commit next micro PC of a specific thread. */
|
||||||
|
void setNextMicroPC(Addr val, unsigned tid);
|
||||||
|
|
||||||
/** Function to add instruction onto the head of the list of the
|
/** Function to add instruction onto the head of the list of the
|
||||||
* instructions. Used when new instructions are fetched.
|
* instructions. Used when new instructions are fetched.
|
||||||
|
@ -468,8 +480,7 @@ class FullO3CPU : public BaseO3CPU
|
||||||
|
|
||||||
/** Remove all instructions that are not currently in the ROB.
|
/** Remove all instructions that are not currently in the ROB.
|
||||||
* There's also an option to not squash delay slot instructions.*/
|
* There's also an option to not squash delay slot instructions.*/
|
||||||
void removeInstsNotInROB(unsigned tid, bool squash_delay_slot,
|
void removeInstsNotInROB(unsigned tid);
|
||||||
const InstSeqNum &delay_slot_seq_num);
|
|
||||||
|
|
||||||
/** Remove all instructions younger than the given sequence number. */
|
/** Remove all instructions younger than the given sequence number. */
|
||||||
void removeInstsUntil(const InstSeqNum &seq_num,unsigned tid);
|
void removeInstsUntil(const InstSeqNum &seq_num,unsigned tid);
|
||||||
|
|
|
@ -49,8 +49,6 @@ DefaultDecode<Impl>::DefaultDecode(O3CPU *_cpu, Params *params)
|
||||||
stalls[i].rename = false;
|
stalls[i].rename = false;
|
||||||
stalls[i].iew = false;
|
stalls[i].iew = false;
|
||||||
stalls[i].commit = false;
|
stalls[i].commit = false;
|
||||||
|
|
||||||
squashAfterDelaySlot[i] = false;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// @todo: Make into a parameter
|
// @todo: Make into a parameter
|
||||||
|
@ -275,20 +273,16 @@ DefaultDecode<Impl>::squash(DynInstPtr &inst, unsigned tid)
|
||||||
///explicitly for ISAs with delay slots.
|
///explicitly for ISAs with delay slots.
|
||||||
toFetch->decodeInfo[tid].nextNPC =
|
toFetch->decodeInfo[tid].nextNPC =
|
||||||
inst->branchTarget() + sizeof(TheISA::MachInst);
|
inst->branchTarget() + sizeof(TheISA::MachInst);
|
||||||
|
toFetch->decodeInfo[tid].nextMicroPC = inst->readMicroPC();
|
||||||
#if ISA_HAS_DELAY_SLOT
|
#if ISA_HAS_DELAY_SLOT
|
||||||
toFetch->decodeInfo[tid].branchTaken = inst->readNextNPC() !=
|
toFetch->decodeInfo[tid].branchTaken = inst->readNextNPC() !=
|
||||||
(inst->readNextPC() + sizeof(TheISA::MachInst));
|
(inst->readNextPC() + sizeof(TheISA::MachInst));
|
||||||
|
|
||||||
toFetch->decodeInfo[tid].bdelayDoneSeqNum = bdelayDoneSeqNum[tid];
|
|
||||||
squashAfterDelaySlot[tid] = false;
|
|
||||||
|
|
||||||
InstSeqNum squash_seq_num = bdelayDoneSeqNum[tid];
|
|
||||||
#else
|
#else
|
||||||
toFetch->decodeInfo[tid].branchTaken =
|
toFetch->decodeInfo[tid].branchTaken =
|
||||||
inst->readNextPC() != (inst->readPC() + sizeof(TheISA::MachInst));
|
inst->readNextPC() != (inst->readPC() + sizeof(TheISA::MachInst));
|
||||||
|
#endif
|
||||||
|
|
||||||
InstSeqNum squash_seq_num = inst->seqNum;
|
InstSeqNum squash_seq_num = inst->seqNum;
|
||||||
#endif
|
|
||||||
|
|
||||||
// Might have to tell fetch to unblock.
|
// Might have to tell fetch to unblock.
|
||||||
if (decodeStatus[tid] == Blocked ||
|
if (decodeStatus[tid] == Blocked ||
|
||||||
|
@ -309,30 +303,10 @@ DefaultDecode<Impl>::squash(DynInstPtr &inst, unsigned tid)
|
||||||
// Clear the instruction list and skid buffer in case they have any
|
// Clear the instruction list and skid buffer in case they have any
|
||||||
// insts in them.
|
// insts in them.
|
||||||
while (!insts[tid].empty()) {
|
while (!insts[tid].empty()) {
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if (insts[tid].front()->seqNum <= squash_seq_num) {
|
|
||||||
DPRINTF(Decode, "[tid:%i]: Cannot remove incoming decode "
|
|
||||||
"instructions before delay slot [sn:%i]. %i insts"
|
|
||||||
"left in decode.\n", tid, squash_seq_num,
|
|
||||||
insts[tid].size());
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
insts[tid].pop();
|
insts[tid].pop();
|
||||||
}
|
}
|
||||||
|
|
||||||
while (!skidBuffer[tid].empty()) {
|
while (!skidBuffer[tid].empty()) {
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if (skidBuffer[tid].front()->seqNum <= squash_seq_num) {
|
|
||||||
DPRINTF(Decode, "[tid:%i]: Cannot remove skidBuffer "
|
|
||||||
"instructions before delay slot [sn:%i]. %i insts"
|
|
||||||
"left in decode.\n", tid, squash_seq_num,
|
|
||||||
insts[tid].size());
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
skidBuffer[tid].pop();
|
skidBuffer[tid].pop();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -760,47 +734,12 @@ DefaultDecode<Impl>::decodeInsts(unsigned tid)
|
||||||
|
|
||||||
// Might want to set some sort of boolean and just do
|
// Might want to set some sort of boolean and just do
|
||||||
// a check at the end
|
// a check at the end
|
||||||
#if !ISA_HAS_DELAY_SLOT
|
|
||||||
squash(inst, inst->threadNumber);
|
squash(inst, inst->threadNumber);
|
||||||
Addr target = inst->branchTarget();
|
Addr target = inst->branchTarget();
|
||||||
inst->setPredTarg(target, target + sizeof(TheISA::MachInst));
|
//The micro pc after an instruction level branch should be 0
|
||||||
|
inst->setPredTarg(target, target + sizeof(TheISA::MachInst), 0);
|
||||||
break;
|
break;
|
||||||
#else
|
|
||||||
// If mispredicted as taken, then ignore delay slot
|
|
||||||
// instruction... else keep delay slot and squash
|
|
||||||
// after it is sent to rename
|
|
||||||
if (inst->readPredTaken() && inst->isCondDelaySlot()) {
|
|
||||||
DPRINTF(Decode, "[tid:%i]: Conditional delay slot inst."
|
|
||||||
"[sn:%i] PC %#x mispredicted as taken.\n", tid,
|
|
||||||
inst->seqNum, inst->PC);
|
|
||||||
bdelayDoneSeqNum[tid] = inst->seqNum;
|
|
||||||
squash(inst, inst->threadNumber);
|
|
||||||
Addr target = inst->branchTarget();
|
|
||||||
inst->setPredTarg(target,
|
|
||||||
target + sizeof(TheISA::MachInst));
|
|
||||||
break;
|
|
||||||
} else {
|
|
||||||
DPRINTF(Decode, "[tid:%i]: Misprediction detected at "
|
|
||||||
"[sn:%i] PC %#x, will squash after delay slot "
|
|
||||||
"inst. is sent to Rename\n",
|
|
||||||
tid, inst->seqNum, inst->PC);
|
|
||||||
bdelayDoneSeqNum[tid] = inst->seqNum + 1;
|
|
||||||
squashAfterDelaySlot[tid] = true;
|
|
||||||
squashInst[tid] = inst;
|
|
||||||
continue;
|
|
||||||
}
|
}
|
||||||
#endif
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
if (squashAfterDelaySlot[tid]) {
|
|
||||||
assert(!inst->isSquashed());
|
|
||||||
squash(squashInst[tid], squashInst[tid]->threadNumber);
|
|
||||||
Addr target = squashInst[tid]->branchTarget();
|
|
||||||
squashInst[tid]->setPredTarg(target,
|
|
||||||
target + sizeof(TheISA::MachInst));
|
|
||||||
assert(!inst->isSquashed());
|
|
||||||
break;
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -227,7 +227,7 @@ class DefaultFetch
|
||||||
* @param next_NPC Used for ISAs which use delay slots.
|
* @param next_NPC Used for ISAs which use delay slots.
|
||||||
* @return Whether or not a branch was predicted as taken.
|
* @return Whether or not a branch was predicted as taken.
|
||||||
*/
|
*/
|
||||||
bool lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC, Addr &next_NPC);
|
bool lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC, Addr &next_NPC, Addr &next_MicroPC);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Fetches the cache line that contains fetch_PC. Returns any
|
* Fetches the cache line that contains fetch_PC. Returns any
|
||||||
|
@ -242,12 +242,14 @@ class DefaultFetch
|
||||||
bool fetchCacheLine(Addr fetch_PC, Fault &ret_fault, unsigned tid);
|
bool fetchCacheLine(Addr fetch_PC, Fault &ret_fault, unsigned tid);
|
||||||
|
|
||||||
/** Squashes a specific thread and resets the PC. */
|
/** Squashes a specific thread and resets the PC. */
|
||||||
inline void doSquash(const Addr &new_PC, const Addr &new_NPC, unsigned tid);
|
inline void doSquash(const Addr &new_PC, const Addr &new_NPC,
|
||||||
|
const Addr &new_MicroPC, unsigned tid);
|
||||||
|
|
||||||
/** Squashes a specific thread and resets the PC. Also tells the CPU to
|
/** Squashes a specific thread and resets the PC. Also tells the CPU to
|
||||||
* remove any instructions between fetch and decode that should be sqaushed.
|
* remove any instructions between fetch and decode that should be sqaushed.
|
||||||
*/
|
*/
|
||||||
void squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
|
void squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
|
||||||
|
const Addr &new_MicroPC,
|
||||||
const InstSeqNum &seq_num, unsigned tid);
|
const InstSeqNum &seq_num, unsigned tid);
|
||||||
|
|
||||||
/** Checks if a thread is stalled. */
|
/** Checks if a thread is stalled. */
|
||||||
|
@ -263,8 +265,8 @@ class DefaultFetch
|
||||||
* squash should be the commit stage.
|
* squash should be the commit stage.
|
||||||
*/
|
*/
|
||||||
void squash(const Addr &new_PC, const Addr &new_NPC,
|
void squash(const Addr &new_PC, const Addr &new_NPC,
|
||||||
const InstSeqNum &seq_num,
|
const Addr &new_MicroPC,
|
||||||
bool squash_delay_slot, unsigned tid);
|
const InstSeqNum &seq_num, unsigned tid);
|
||||||
|
|
||||||
/** Ticks the fetch stage, processing all inputs signals and fetching
|
/** Ticks the fetch stage, processing all inputs signals and fetching
|
||||||
* as many instructions as possible.
|
* as many instructions as possible.
|
||||||
|
@ -347,16 +349,12 @@ class DefaultFetch
|
||||||
/** Per-thread fetch PC. */
|
/** Per-thread fetch PC. */
|
||||||
Addr PC[Impl::MaxThreads];
|
Addr PC[Impl::MaxThreads];
|
||||||
|
|
||||||
|
/** Per-thread fetch micro PC. */
|
||||||
|
Addr microPC[Impl::MaxThreads];
|
||||||
|
|
||||||
/** Per-thread next PC. */
|
/** Per-thread next PC. */
|
||||||
Addr nextPC[Impl::MaxThreads];
|
Addr nextPC[Impl::MaxThreads];
|
||||||
|
|
||||||
/** Per-thread next Next PC.
|
|
||||||
* This is not a real register but is used for
|
|
||||||
* architectures that use a branch-delay slot.
|
|
||||||
* (such as MIPS or Sparc)
|
|
||||||
*/
|
|
||||||
Addr nextNPC[Impl::MaxThreads];
|
|
||||||
|
|
||||||
/** Memory request used to access cache. */
|
/** Memory request used to access cache. */
|
||||||
RequestPtr memReq[Impl::MaxThreads];
|
RequestPtr memReq[Impl::MaxThreads];
|
||||||
|
|
||||||
|
|
|
@ -312,7 +312,7 @@ DefaultFetch<Impl>::initStage()
|
||||||
for (int tid = 0; tid < numThreads; tid++) {
|
for (int tid = 0; tid < numThreads; tid++) {
|
||||||
PC[tid] = cpu->readPC(tid);
|
PC[tid] = cpu->readPC(tid);
|
||||||
nextPC[tid] = cpu->readNextPC(tid);
|
nextPC[tid] = cpu->readNextPC(tid);
|
||||||
nextNPC[tid] = cpu->readNextNPC(tid);
|
microPC[tid] = cpu->readMicroPC(tid);
|
||||||
}
|
}
|
||||||
|
|
||||||
for (int tid=0; tid < numThreads; tid++) {
|
for (int tid=0; tid < numThreads; tid++) {
|
||||||
|
@ -439,11 +439,7 @@ DefaultFetch<Impl>::takeOverFrom()
|
||||||
stalls[i].commit = 0;
|
stalls[i].commit = 0;
|
||||||
PC[i] = cpu->readPC(i);
|
PC[i] = cpu->readPC(i);
|
||||||
nextPC[i] = cpu->readNextPC(i);
|
nextPC[i] = cpu->readNextPC(i);
|
||||||
#if ISA_HAS_DELAY_SLOT
|
microPC[i] = cpu->readMicroPC(i);
|
||||||
nextNPC[i] = cpu->readNextNPC(i);
|
|
||||||
#else
|
|
||||||
nextNPC[i] = nextPC[i] + sizeof(TheISA::MachInst);
|
|
||||||
#endif
|
|
||||||
fetchStatus[i] = Running;
|
fetchStatus[i] = Running;
|
||||||
}
|
}
|
||||||
numInst = 0;
|
numInst = 0;
|
||||||
|
@ -493,7 +489,7 @@ DefaultFetch<Impl>::switchToInactive()
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
bool
|
bool
|
||||||
DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
|
DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
|
||||||
Addr &next_NPC)
|
Addr &next_NPC, Addr &next_MicroPC)
|
||||||
{
|
{
|
||||||
// Do branch prediction check here.
|
// Do branch prediction check here.
|
||||||
// A bit of a misnomer...next_PC is actually the current PC until
|
// A bit of a misnomer...next_PC is actually the current PC until
|
||||||
|
@ -501,13 +497,22 @@ DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
|
||||||
bool predict_taken;
|
bool predict_taken;
|
||||||
|
|
||||||
if (!inst->isControl()) {
|
if (!inst->isControl()) {
|
||||||
|
if (inst->isMicroOp() && !inst->isLastMicroOp()) {
|
||||||
|
next_MicroPC++;
|
||||||
|
} else {
|
||||||
next_PC = next_NPC;
|
next_PC = next_NPC;
|
||||||
next_NPC = next_NPC + instSize;
|
next_NPC = next_NPC + instSize;
|
||||||
inst->setPredTarg(next_PC, next_NPC);
|
next_MicroPC = 0;
|
||||||
|
}
|
||||||
|
inst->setPredTarg(next_PC, next_NPC, next_MicroPC);
|
||||||
inst->setPredTaken(false);
|
inst->setPredTaken(false);
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
//Assume for now that all control flow is to a different macroop which
|
||||||
|
//would reset the micro pc to 0.
|
||||||
|
next_MicroPC = 0;
|
||||||
|
|
||||||
int tid = inst->threadNumber;
|
int tid = inst->threadNumber;
|
||||||
Addr pred_PC = next_PC;
|
Addr pred_PC = next_PC;
|
||||||
predict_taken = branchPred.predict(inst, pred_PC, tid);
|
predict_taken = branchPred.predict(inst, pred_PC, tid);
|
||||||
|
@ -534,7 +539,7 @@ DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
|
||||||
#endif
|
#endif
|
||||||
/* DPRINTF(Fetch, "[tid:%i]: Branch predicted to go to %#x and then %#x.\n",
|
/* DPRINTF(Fetch, "[tid:%i]: Branch predicted to go to %#x and then %#x.\n",
|
||||||
tid, next_PC, next_NPC);*/
|
tid, next_PC, next_NPC);*/
|
||||||
inst->setPredTarg(next_PC, next_NPC);
|
inst->setPredTarg(next_PC, next_NPC, next_MicroPC);
|
||||||
inst->setPredTaken(predict_taken);
|
inst->setPredTaken(predict_taken);
|
||||||
|
|
||||||
++fetchedBranches;
|
++fetchedBranches;
|
||||||
|
@ -658,14 +663,14 @@ DefaultFetch<Impl>::fetchCacheLine(Addr fetch_PC, Fault &ret_fault, unsigned tid
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
inline void
|
inline void
|
||||||
DefaultFetch<Impl>::doSquash(const Addr &new_PC,
|
DefaultFetch<Impl>::doSquash(const Addr &new_PC,
|
||||||
const Addr &new_NPC, unsigned tid)
|
const Addr &new_NPC, const Addr &new_microPC, unsigned tid)
|
||||||
{
|
{
|
||||||
DPRINTF(Fetch, "[tid:%i]: Squashing, setting PC to: %#x, NPC to: %#x.\n",
|
DPRINTF(Fetch, "[tid:%i]: Squashing, setting PC to: %#x, NPC to: %#x.\n",
|
||||||
tid, new_PC, new_NPC);
|
tid, new_PC, new_NPC);
|
||||||
|
|
||||||
PC[tid] = new_PC;
|
PC[tid] = new_PC;
|
||||||
nextPC[tid] = new_NPC;
|
nextPC[tid] = new_NPC;
|
||||||
nextNPC[tid] = new_NPC + instSize;
|
microPC[tid] = new_microPC;
|
||||||
|
|
||||||
// Clear the icache miss if it's outstanding.
|
// Clear the icache miss if it's outstanding.
|
||||||
if (fetchStatus[tid] == IcacheWaitResponse) {
|
if (fetchStatus[tid] == IcacheWaitResponse) {
|
||||||
|
@ -693,12 +698,12 @@ DefaultFetch<Impl>::doSquash(const Addr &new_PC,
|
||||||
template<class Impl>
|
template<class Impl>
|
||||||
void
|
void
|
||||||
DefaultFetch<Impl>::squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
|
DefaultFetch<Impl>::squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
|
||||||
const InstSeqNum &seq_num,
|
const Addr &new_MicroPC,
|
||||||
unsigned tid)
|
const InstSeqNum &seq_num, unsigned tid)
|
||||||
{
|
{
|
||||||
DPRINTF(Fetch, "[tid:%i]: Squashing from decode.\n",tid);
|
DPRINTF(Fetch, "[tid:%i]: Squashing from decode.\n",tid);
|
||||||
|
|
||||||
doSquash(new_PC, new_NPC, tid);
|
doSquash(new_PC, new_NPC, new_MicroPC, tid);
|
||||||
|
|
||||||
// Tell the CPU to remove any instructions that are in flight between
|
// Tell the CPU to remove any instructions that are in flight between
|
||||||
// fetch and decode.
|
// fetch and decode.
|
||||||
|
@ -774,20 +779,15 @@ DefaultFetch<Impl>::updateFetchStatus()
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
void
|
void
|
||||||
DefaultFetch<Impl>::squash(const Addr &new_PC, const Addr &new_NPC,
|
DefaultFetch<Impl>::squash(const Addr &new_PC, const Addr &new_NPC,
|
||||||
const InstSeqNum &seq_num,
|
const Addr &new_MicroPC,
|
||||||
bool squash_delay_slot, unsigned tid)
|
const InstSeqNum &seq_num, unsigned tid)
|
||||||
{
|
{
|
||||||
DPRINTF(Fetch, "[tid:%u]: Squash from commit.\n",tid);
|
DPRINTF(Fetch, "[tid:%u]: Squash from commit.\n",tid);
|
||||||
|
|
||||||
doSquash(new_PC, new_NPC, tid);
|
doSquash(new_PC, new_NPC, new_MicroPC, tid);
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
// Tell the CPU to remove any instructions that are not in the ROB.
|
// Tell the CPU to remove any instructions that are not in the ROB.
|
||||||
cpu->removeInstsNotInROB(tid, squash_delay_slot, seq_num);
|
cpu->removeInstsNotInROB(tid);
|
||||||
#else
|
|
||||||
// Tell the CPU to remove any instructions that are not in the ROB.
|
|
||||||
cpu->removeInstsNotInROB(tid, true, 0);
|
|
||||||
#endif
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
|
@ -896,17 +896,11 @@ DefaultFetch<Impl>::checkSignalsAndUpdate(unsigned tid)
|
||||||
|
|
||||||
DPRINTF(Fetch, "[tid:%u]: Squashing instructions due to squash "
|
DPRINTF(Fetch, "[tid:%u]: Squashing instructions due to squash "
|
||||||
"from commit.\n",tid);
|
"from commit.\n",tid);
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
InstSeqNum doneSeqNum = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
|
|
||||||
#else
|
|
||||||
InstSeqNum doneSeqNum = fromCommit->commitInfo[tid].doneSeqNum;
|
|
||||||
#endif
|
|
||||||
// In any case, squash.
|
// In any case, squash.
|
||||||
squash(fromCommit->commitInfo[tid].nextPC,
|
squash(fromCommit->commitInfo[tid].nextPC,
|
||||||
fromCommit->commitInfo[tid].nextNPC,
|
fromCommit->commitInfo[tid].nextNPC,
|
||||||
doneSeqNum,
|
fromCommit->commitInfo[tid].nextMicroPC,
|
||||||
fromCommit->commitInfo[tid].squashDelaySlot,
|
fromCommit->commitInfo[tid].doneSeqNum,
|
||||||
tid);
|
tid);
|
||||||
|
|
||||||
// Also check if there's a mispredict that happened.
|
// Also check if there's a mispredict that happened.
|
||||||
|
@ -955,18 +949,14 @@ DefaultFetch<Impl>::checkSignalsAndUpdate(unsigned tid)
|
||||||
|
|
||||||
if (fetchStatus[tid] != Squashing) {
|
if (fetchStatus[tid] != Squashing) {
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
InstSeqNum doneSeqNum = fromDecode->decodeInfo[tid].bdelayDoneSeqNum;
|
|
||||||
#else
|
|
||||||
InstSeqNum doneSeqNum = fromDecode->decodeInfo[tid].doneSeqNum;
|
|
||||||
#endif
|
|
||||||
DPRINTF(Fetch, "Squashing from decode with PC = %#x, NPC = %#x\n",
|
DPRINTF(Fetch, "Squashing from decode with PC = %#x, NPC = %#x\n",
|
||||||
fromDecode->decodeInfo[tid].nextPC,
|
fromDecode->decodeInfo[tid].nextPC,
|
||||||
fromDecode->decodeInfo[tid].nextNPC);
|
fromDecode->decodeInfo[tid].nextNPC);
|
||||||
// Squash unless we're already squashing
|
// Squash unless we're already squashing
|
||||||
squashFromDecode(fromDecode->decodeInfo[tid].nextPC,
|
squashFromDecode(fromDecode->decodeInfo[tid].nextPC,
|
||||||
fromDecode->decodeInfo[tid].nextNPC,
|
fromDecode->decodeInfo[tid].nextNPC,
|
||||||
doneSeqNum,
|
fromDecode->decodeInfo[tid].nextMicroPC,
|
||||||
|
fromDecode->decodeInfo[tid].doneSeqNum,
|
||||||
tid);
|
tid);
|
||||||
|
|
||||||
return true;
|
return true;
|
||||||
|
@ -1020,9 +1010,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
DPRINTF(Fetch, "Attempting to fetch from [tid:%i]\n", tid);
|
DPRINTF(Fetch, "Attempting to fetch from [tid:%i]\n", tid);
|
||||||
|
|
||||||
// The current PC.
|
// The current PC.
|
||||||
Addr &fetch_PC = PC[tid];
|
Addr fetch_PC = PC[tid];
|
||||||
|
Addr fetch_NPC = nextPC[tid];
|
||||||
Addr &fetch_NPC = nextPC[tid];
|
Addr fetch_MicroPC = microPC[tid];
|
||||||
|
|
||||||
// Fault code for memory access.
|
// Fault code for memory access.
|
||||||
Fault fault = NoFault;
|
Fault fault = NoFault;
|
||||||
|
@ -1081,6 +1071,7 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
|
|
||||||
Addr next_PC = fetch_PC;
|
Addr next_PC = fetch_PC;
|
||||||
Addr next_NPC = fetch_NPC;
|
Addr next_NPC = fetch_NPC;
|
||||||
|
Addr next_MicroPC = fetch_MicroPC;
|
||||||
|
|
||||||
InstSeqNum inst_seq;
|
InstSeqNum inst_seq;
|
||||||
MachInst inst;
|
MachInst inst;
|
||||||
|
@ -1088,6 +1079,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
// @todo: Fix this hack.
|
// @todo: Fix this hack.
|
||||||
unsigned offset = (fetch_PC & cacheBlkMask) & ~3;
|
unsigned offset = (fetch_PC & cacheBlkMask) & ~3;
|
||||||
|
|
||||||
|
StaticInstPtr staticInst = NULL;
|
||||||
|
StaticInstPtr macroop = NULL;
|
||||||
|
|
||||||
if (fault == NoFault) {
|
if (fault == NoFault) {
|
||||||
// If the read of the first instruction was successful, then grab the
|
// If the read of the first instruction was successful, then grab the
|
||||||
// instructions from the rest of the cache line and put them into the
|
// instructions from the rest of the cache line and put them into the
|
||||||
|
@ -1100,11 +1094,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
// ended this fetch block.
|
// ended this fetch block.
|
||||||
bool predicted_branch = false;
|
bool predicted_branch = false;
|
||||||
|
|
||||||
for (;
|
while (offset < cacheBlkSize &&
|
||||||
offset < cacheBlkSize &&
|
|
||||||
numInst < fetchWidth &&
|
numInst < fetchWidth &&
|
||||||
!predicted_branch;
|
!predicted_branch) {
|
||||||
++numInst) {
|
|
||||||
|
|
||||||
// If we're branching after this instruction, quite fetching
|
// If we're branching after this instruction, quite fetching
|
||||||
// from the same block then.
|
// from the same block then.
|
||||||
|
@ -1115,13 +1107,10 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
fetch_PC, fetch_NPC);
|
fetch_PC, fetch_NPC);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
// Get a sequence number.
|
|
||||||
inst_seq = cpu->getAndIncrementInstSeq();
|
|
||||||
|
|
||||||
// Make sure this is a valid index.
|
// Make sure this is a valid index.
|
||||||
assert(offset <= cacheBlkSize - instSize);
|
assert(offset <= cacheBlkSize - instSize);
|
||||||
|
|
||||||
|
if (!macroop) {
|
||||||
// Get the instruction from the array of the cache line.
|
// Get the instruction from the array of the cache line.
|
||||||
inst = TheISA::gtoh(*reinterpret_cast<TheISA::MachInst *>
|
inst = TheISA::gtoh(*reinterpret_cast<TheISA::MachInst *>
|
||||||
(&cacheData[tid][offset]));
|
(&cacheData[tid][offset]));
|
||||||
|
@ -1130,11 +1119,24 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
predecoder.moreBytes(fetch_PC, 0, inst);
|
predecoder.moreBytes(fetch_PC, 0, inst);
|
||||||
|
|
||||||
ext_inst = predecoder.getExtMachInst();
|
ext_inst = predecoder.getExtMachInst();
|
||||||
|
staticInst = StaticInstPtr(ext_inst);
|
||||||
|
if (staticInst->isMacroOp())
|
||||||
|
macroop = staticInst;
|
||||||
|
}
|
||||||
|
do {
|
||||||
|
if (macroop) {
|
||||||
|
staticInst = macroop->fetchMicroOp(fetch_MicroPC);
|
||||||
|
if (staticInst->isLastMicroOp())
|
||||||
|
macroop = NULL;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Get a sequence number.
|
||||||
|
inst_seq = cpu->getAndIncrementInstSeq();
|
||||||
|
|
||||||
// Create a new DynInst from the instruction fetched.
|
// Create a new DynInst from the instruction fetched.
|
||||||
DynInstPtr instruction = new DynInst(ext_inst,
|
DynInstPtr instruction = new DynInst(staticInst,
|
||||||
fetch_PC, fetch_NPC,
|
fetch_PC, fetch_NPC, fetch_MicroPC,
|
||||||
next_PC, next_NPC,
|
next_PC, next_NPC, next_MicroPC,
|
||||||
inst_seq, cpu);
|
inst_seq, cpu);
|
||||||
instruction->setTid(tid);
|
instruction->setTid(tid);
|
||||||
|
|
||||||
|
@ -1157,11 +1159,8 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
instruction->readPC());
|
instruction->readPC());
|
||||||
|
|
||||||
///FIXME This needs to be more robust in dealing with delay slots
|
///FIXME This needs to be more robust in dealing with delay slots
|
||||||
#if !ISA_HAS_DELAY_SLOT
|
predicted_branch |=
|
||||||
// predicted_branch |=
|
lookupAndUpdateNextPC(instruction, next_PC, next_NPC, next_MicroPC);
|
||||||
#endif
|
|
||||||
lookupAndUpdateNextPC(instruction, next_PC, next_NPC);
|
|
||||||
predicted_branch |= (next_PC != fetch_NPC);
|
|
||||||
|
|
||||||
// Add instruction to the CPU's list of instructions.
|
// Add instruction to the CPU's list of instructions.
|
||||||
instruction->setInstListIt(cpu->addInst(instruction));
|
instruction->setInstListIt(cpu->addInst(instruction));
|
||||||
|
@ -1178,6 +1177,7 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
// Move to the next instruction, unless we have a branch.
|
// Move to the next instruction, unless we have a branch.
|
||||||
fetch_PC = next_PC;
|
fetch_PC = next_PC;
|
||||||
fetch_NPC = next_NPC;
|
fetch_NPC = next_NPC;
|
||||||
|
fetch_MicroPC = next_MicroPC;
|
||||||
|
|
||||||
if (instruction->isQuiesce()) {
|
if (instruction->isQuiesce()) {
|
||||||
DPRINTF(Fetch, "Quiesce instruction encountered, halting fetch!",
|
DPRINTF(Fetch, "Quiesce instruction encountered, halting fetch!",
|
||||||
|
@ -1188,18 +1188,22 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
++numInst;
|
||||||
|
} while (staticInst->isMicroOp() &&
|
||||||
|
!staticInst->isLastMicroOp() &&
|
||||||
|
numInst < fetchWidth);
|
||||||
offset += instSize;
|
offset += instSize;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (offset >= cacheBlkSize) {
|
if (predicted_branch) {
|
||||||
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached the end of cache "
|
DPRINTF(Fetch, "[tid:%i]: Done fetching, predicted branch "
|
||||||
"block.\n", tid);
|
"instruction encountered.\n", tid);
|
||||||
} else if (numInst >= fetchWidth) {
|
} else if (numInst >= fetchWidth) {
|
||||||
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached fetch bandwidth "
|
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached fetch bandwidth "
|
||||||
"for this cycle.\n", tid);
|
"for this cycle.\n", tid);
|
||||||
} else if (predicted_branch) {
|
} else if (offset >= cacheBlkSize) {
|
||||||
DPRINTF(Fetch, "[tid:%i]: Done fetching, predicted branch "
|
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached the end of cache "
|
||||||
"instruction encountered.\n", tid);
|
"block.\n", tid);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1212,12 +1216,8 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
if (fault == NoFault) {
|
if (fault == NoFault) {
|
||||||
PC[tid] = next_PC;
|
PC[tid] = next_PC;
|
||||||
nextPC[tid] = next_NPC;
|
nextPC[tid] = next_NPC;
|
||||||
nextNPC[tid] = next_NPC + instSize;
|
microPC[tid] = next_MicroPC;
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
DPRINTF(Fetch, "[tid:%i]: Setting PC to %08p.\n", tid, PC[tid]);
|
|
||||||
#else
|
|
||||||
DPRINTF(Fetch, "[tid:%i]: Setting PC to %08p.\n", tid, next_PC);
|
DPRINTF(Fetch, "[tid:%i]: Setting PC to %08p.\n", tid, next_PC);
|
||||||
#endif
|
|
||||||
} else {
|
} else {
|
||||||
// We shouldn't be in an icache miss and also have a fault (an ITB
|
// We shouldn't be in an icache miss and also have a fault (an ITB
|
||||||
// miss)
|
// miss)
|
||||||
|
@ -1235,8 +1235,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
|
||||||
// We will use a nop in order to carry the fault.
|
// We will use a nop in order to carry the fault.
|
||||||
ext_inst = TheISA::NoopMachInst;
|
ext_inst = TheISA::NoopMachInst;
|
||||||
|
|
||||||
|
StaticInstPtr staticInst = new StaticInst(ext_inst);
|
||||||
// Create a new DynInst from the dummy nop.
|
// Create a new DynInst from the dummy nop.
|
||||||
DynInstPtr instruction = new DynInst(ext_inst,
|
DynInstPtr instruction = new DynInst(staticInst,
|
||||||
fetch_PC, fetch_NPC,
|
fetch_PC, fetch_NPC,
|
||||||
next_PC, next_NPC,
|
next_PC, next_NPC,
|
||||||
inst_seq, cpu);
|
inst_seq, cpu);
|
||||||
|
|
|
@ -168,7 +168,9 @@ SimpleFreeList::addReg(PhysRegIndex freed_reg)
|
||||||
if (freed_reg != TheISA::ZeroReg)
|
if (freed_reg != TheISA::ZeroReg)
|
||||||
freeIntRegs.push(freed_reg);
|
freeIntRegs.push(freed_reg);
|
||||||
} else if (freed_reg < numPhysicalRegs) {
|
} else if (freed_reg < numPhysicalRegs) {
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
if (freed_reg != (TheISA::ZeroReg + numPhysicalIntRegs))
|
if (freed_reg != (TheISA::ZeroReg + numPhysicalIntRegs))
|
||||||
|
#endif
|
||||||
freeFloatRegs.push(freed_reg);
|
freeFloatRegs.push(freed_reg);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -402,9 +402,6 @@ class DefaultIEW
|
||||||
/** Records if there is a fetch redirect on this cycle for each thread. */
|
/** Records if there is a fetch redirect on this cycle for each thread. */
|
||||||
bool fetchRedirect[Impl::MaxThreads];
|
bool fetchRedirect[Impl::MaxThreads];
|
||||||
|
|
||||||
/** Keeps track of the last valid branch delay slot instss for threads */
|
|
||||||
InstSeqNum bdelayDoneSeqNum[Impl::MaxThreads];
|
|
||||||
|
|
||||||
/** Used to track if all instructions have been dispatched this cycle.
|
/** Used to track if all instructions have been dispatched this cycle.
|
||||||
* If they have not, then blocking must have occurred, and the instructions
|
* If they have not, then blocking must have occurred, and the instructions
|
||||||
* would already be added to the skid buffer.
|
* would already be added to the skid buffer.
|
||||||
|
|
|
@ -69,7 +69,6 @@ DefaultIEW<Impl>::DefaultIEW(O3CPU *_cpu, Params *params)
|
||||||
dispatchStatus[i] = Running;
|
dispatchStatus[i] = Running;
|
||||||
stalls[i].commit = false;
|
stalls[i].commit = false;
|
||||||
fetchRedirect[i] = false;
|
fetchRedirect[i] = false;
|
||||||
bdelayDoneSeqNum[i] = 0;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
wbMax = wbWidth * params->wbDepth;
|
wbMax = wbWidth * params->wbDepth;
|
||||||
|
@ -410,31 +409,14 @@ DefaultIEW<Impl>::squash(unsigned tid)
|
||||||
instQueue.squash(tid);
|
instQueue.squash(tid);
|
||||||
|
|
||||||
// Tell the LDSTQ to start squashing.
|
// Tell the LDSTQ to start squashing.
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
ldstQueue.squash(fromCommit->commitInfo[tid].bdelayDoneSeqNum, tid);
|
|
||||||
#else
|
|
||||||
ldstQueue.squash(fromCommit->commitInfo[tid].doneSeqNum, tid);
|
ldstQueue.squash(fromCommit->commitInfo[tid].doneSeqNum, tid);
|
||||||
#endif
|
|
||||||
updatedQueues = true;
|
updatedQueues = true;
|
||||||
|
|
||||||
// Clear the skid buffer in case it has any data in it.
|
// Clear the skid buffer in case it has any data in it.
|
||||||
DPRINTF(IEW, "[tid:%i]: Removing skidbuffer instructions until [sn:%i].\n",
|
DPRINTF(IEW, "[tid:%i]: Removing skidbuffer instructions until [sn:%i].\n",
|
||||||
tid, fromCommit->commitInfo[tid].bdelayDoneSeqNum);
|
tid, fromCommit->commitInfo[tid].doneSeqNum);
|
||||||
|
|
||||||
while (!skidBuffer[tid].empty()) {
|
while (!skidBuffer[tid].empty()) {
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if (skidBuffer[tid].front()->seqNum <=
|
|
||||||
fromCommit->commitInfo[tid].bdelayDoneSeqNum) {
|
|
||||||
DPRINTF(IEW, "[tid:%i]: Cannot remove skidbuffer instructions "
|
|
||||||
"that occur before delay slot [sn:%i].\n",
|
|
||||||
fromCommit->commitInfo[tid].bdelayDoneSeqNum,
|
|
||||||
tid);
|
|
||||||
break;
|
|
||||||
} else {
|
|
||||||
DPRINTF(IEW, "[tid:%i]: Removing instruction [sn:%i] from "
|
|
||||||
"skidBuffer.\n", tid, skidBuffer[tid].front()->seqNum);
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
if (skidBuffer[tid].front()->isLoad() ||
|
if (skidBuffer[tid].front()->isLoad() ||
|
||||||
skidBuffer[tid].front()->isStore() ) {
|
skidBuffer[tid].front()->isStore() ) {
|
||||||
toRename->iewInfo[tid].dispatchedToLSQ++;
|
toRename->iewInfo[tid].dispatchedToLSQ++;
|
||||||
|
@ -445,8 +427,6 @@ DefaultIEW<Impl>::squash(unsigned tid)
|
||||||
skidBuffer[tid].pop();
|
skidBuffer[tid].pop();
|
||||||
}
|
}
|
||||||
|
|
||||||
bdelayDoneSeqNum[tid] = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
|
|
||||||
|
|
||||||
emptyRenameInsts(tid);
|
emptyRenameInsts(tid);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -462,38 +442,19 @@ DefaultIEW<Impl>::squashDueToBranch(DynInstPtr &inst, unsigned tid)
|
||||||
toCommit->mispredPC[tid] = inst->readPC();
|
toCommit->mispredPC[tid] = inst->readPC();
|
||||||
toCommit->branchMispredict[tid] = true;
|
toCommit->branchMispredict[tid] = true;
|
||||||
|
|
||||||
int instSize = sizeof(TheISA::MachInst);
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
#if ISA_HAS_DELAY_SLOT
|
||||||
bool branch_taken =
|
int instSize = sizeof(TheISA::MachInst);
|
||||||
|
toCommit->branchTaken[tid] =
|
||||||
!(inst->readNextPC() + instSize == inst->readNextNPC() &&
|
!(inst->readNextPC() + instSize == inst->readNextNPC() &&
|
||||||
(inst->readNextPC() == inst->readPC() + instSize ||
|
(inst->readNextPC() == inst->readPC() + instSize ||
|
||||||
inst->readNextPC() == inst->readPC() + 2 * instSize));
|
inst->readNextPC() == inst->readPC() + 2 * instSize));
|
||||||
DPRINTF(Sparc, "Branch taken = %s [sn:%i]\n",
|
|
||||||
branch_taken ? "true": "false", inst->seqNum);
|
|
||||||
|
|
||||||
toCommit->branchTaken[tid] = branch_taken;
|
|
||||||
|
|
||||||
bool squashDelaySlot = true;
|
|
||||||
// (inst->readNextPC() != inst->readPC() + sizeof(TheISA::MachInst));
|
|
||||||
DPRINTF(Sparc, "Squash delay slot = %s [sn:%i]\n",
|
|
||||||
squashDelaySlot ? "true": "false", inst->seqNum);
|
|
||||||
toCommit->squashDelaySlot[tid] = squashDelaySlot;
|
|
||||||
//If we're squashing the delay slot, we need to pick back up at NextPC.
|
|
||||||
//Otherwise, NextPC isn't being squashed, so we should pick back up at
|
|
||||||
//NextNPC.
|
|
||||||
if (squashDelaySlot) {
|
|
||||||
toCommit->nextPC[tid] = inst->readNextPC();
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextNPC();
|
|
||||||
} else {
|
|
||||||
toCommit->nextPC[tid] = inst->readNextNPC();
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextNPC() + instSize;
|
|
||||||
}
|
|
||||||
#else
|
#else
|
||||||
toCommit->branchTaken[tid] = inst->readNextPC() !=
|
toCommit->branchTaken[tid] = inst->readNextPC() !=
|
||||||
(inst->readPC() + sizeof(TheISA::MachInst));
|
(inst->readPC() + sizeof(TheISA::MachInst));
|
||||||
toCommit->nextPC[tid] = inst->readNextPC();
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextPC() + instSize;
|
|
||||||
#endif
|
#endif
|
||||||
|
toCommit->nextPC[tid] = inst->readNextPC();
|
||||||
|
toCommit->nextNPC[tid] = inst->readNextNPC();
|
||||||
|
toCommit->nextMicroPC[tid] = inst->readNextMicroPC();
|
||||||
|
|
||||||
toCommit->includeSquashInst[tid] = false;
|
toCommit->includeSquashInst[tid] = false;
|
||||||
|
|
||||||
|
@ -510,11 +471,7 @@ DefaultIEW<Impl>::squashDueToMemOrder(DynInstPtr &inst, unsigned tid)
|
||||||
toCommit->squash[tid] = true;
|
toCommit->squash[tid] = true;
|
||||||
toCommit->squashedSeqNum[tid] = inst->seqNum;
|
toCommit->squashedSeqNum[tid] = inst->seqNum;
|
||||||
toCommit->nextPC[tid] = inst->readNextPC();
|
toCommit->nextPC[tid] = inst->readNextPC();
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextNPC();
|
toCommit->nextNPC[tid] = inst->readNextNPC();
|
||||||
#else
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextPC() + sizeof(TheISA::MachInst);
|
|
||||||
#endif
|
|
||||||
toCommit->branchMispredict[tid] = false;
|
toCommit->branchMispredict[tid] = false;
|
||||||
|
|
||||||
toCommit->includeSquashInst[tid] = false;
|
toCommit->includeSquashInst[tid] = false;
|
||||||
|
@ -532,11 +489,7 @@ DefaultIEW<Impl>::squashDueToMemBlocked(DynInstPtr &inst, unsigned tid)
|
||||||
toCommit->squash[tid] = true;
|
toCommit->squash[tid] = true;
|
||||||
toCommit->squashedSeqNum[tid] = inst->seqNum;
|
toCommit->squashedSeqNum[tid] = inst->seqNum;
|
||||||
toCommit->nextPC[tid] = inst->readPC();
|
toCommit->nextPC[tid] = inst->readPC();
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
toCommit->nextNPC[tid] = inst->readNextPC();
|
toCommit->nextNPC[tid] = inst->readNextPC();
|
||||||
#else
|
|
||||||
toCommit->nextNPC[tid] = inst->readPC() + sizeof(TheISA::MachInst);
|
|
||||||
#endif
|
|
||||||
toCommit->branchMispredict[tid] = false;
|
toCommit->branchMispredict[tid] = false;
|
||||||
|
|
||||||
// Must include the broadcasted SN in the squash.
|
// Must include the broadcasted SN in the squash.
|
||||||
|
@ -880,10 +833,8 @@ DefaultIEW<Impl>::sortInsts()
|
||||||
{
|
{
|
||||||
int insts_from_rename = fromRename->size;
|
int insts_from_rename = fromRename->size;
|
||||||
#ifdef DEBUG
|
#ifdef DEBUG
|
||||||
#if !ISA_HAS_DELAY_SLOT
|
|
||||||
for (int i = 0; i < numThreads; i++)
|
for (int i = 0; i < numThreads; i++)
|
||||||
assert(insts[i].empty());
|
assert(insts[i].empty());
|
||||||
#endif
|
|
||||||
#endif
|
#endif
|
||||||
for (int i = 0; i < insts_from_rename; ++i) {
|
for (int i = 0; i < insts_from_rename; ++i) {
|
||||||
insts[fromRename->insts[i]->threadNumber].push(fromRename->insts[i]);
|
insts[fromRename->insts[i]->threadNumber].push(fromRename->insts[i]);
|
||||||
|
@ -894,21 +845,9 @@ template <class Impl>
|
||||||
void
|
void
|
||||||
DefaultIEW<Impl>::emptyRenameInsts(unsigned tid)
|
DefaultIEW<Impl>::emptyRenameInsts(unsigned tid)
|
||||||
{
|
{
|
||||||
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instructions until "
|
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instructions\n", tid);
|
||||||
"[sn:%i].\n", tid, bdelayDoneSeqNum[tid]);
|
|
||||||
|
|
||||||
while (!insts[tid].empty()) {
|
while (!insts[tid].empty()) {
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
if (insts[tid].front()->seqNum <= bdelayDoneSeqNum[tid]) {
|
|
||||||
DPRINTF(IEW, "[tid:%i]: Done removing, cannot remove instruction"
|
|
||||||
" that occurs at or before delay slot [sn:%i].\n",
|
|
||||||
tid, bdelayDoneSeqNum[tid]);
|
|
||||||
break;
|
|
||||||
} else {
|
|
||||||
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instruction "
|
|
||||||
"[sn:%i].\n", tid, insts[tid].front()->seqNum);
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
if (insts[tid].front()->isLoad() ||
|
if (insts[tid].front()->isLoad() ||
|
||||||
insts[tid].front()->isStore() ) {
|
insts[tid].front()->isStore() ) {
|
||||||
|
|
|
@ -1005,11 +1005,7 @@ InstructionQueue<Impl>::squash(unsigned tid)
|
||||||
|
|
||||||
// Read instruction sequence number of last instruction out of the
|
// Read instruction sequence number of last instruction out of the
|
||||||
// time buffer.
|
// time buffer.
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
squashedSeqNum[tid] = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
|
|
||||||
#else
|
|
||||||
squashedSeqNum[tid] = fromCommit->commitInfo[tid].doneSeqNum;
|
squashedSeqNum[tid] = fromCommit->commitInfo[tid].doneSeqNum;
|
||||||
#endif
|
|
||||||
|
|
||||||
// Call doSquash if there are insts in the IQ
|
// Call doSquash if there are insts in the IQ
|
||||||
if (count[tid] > 0) {
|
if (count[tid] > 0) {
|
||||||
|
|
|
@ -69,10 +69,16 @@ class MipsDynInst : public BaseDynInst<Impl>
|
||||||
};
|
};
|
||||||
|
|
||||||
public:
|
public:
|
||||||
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
|
MipsDynInst(StaticInstPtr staticInst,
|
||||||
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a binary instruction. */
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
MipsDynInst(ExtMachInst inst,
|
MipsDynInst(ExtMachInst inst,
|
||||||
Addr PC, Addr NPC,
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr Pred_PC, Addr Pred_NPC,
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
InstSeqNum seq_num, O3CPU *cpu);
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a static inst pointer. */
|
/** BaseDynInst constructor given a static inst pointer. */
|
||||||
|
|
|
@ -31,11 +31,23 @@
|
||||||
#include "cpu/o3/mips/dyn_inst.hh"
|
#include "cpu/o3/mips/dyn_inst.hh"
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
MipsDynInst<Impl>::MipsDynInst(ExtMachInst inst,
|
MipsDynInst<Impl>::MipsDynInst(StaticInstPtr staticInst,
|
||||||
Addr PC, Addr NPC,
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr Pred_PC, Addr Pred_NPC,
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
InstSeqNum seq_num, O3CPU *cpu)
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
|
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
|
{
|
||||||
|
initVars();
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
MipsDynInst<Impl>::MipsDynInst(ExtMachInst inst,
|
||||||
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
|
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
{
|
{
|
||||||
initVars();
|
initVars();
|
||||||
}
|
}
|
||||||
|
|
|
@ -179,7 +179,9 @@ class PhysRegFile
|
||||||
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
|
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
|
||||||
int(reg_idx), (uint64_t)val);
|
int(reg_idx), (uint64_t)val);
|
||||||
|
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
if (reg_idx != TheISA::ZeroReg)
|
if (reg_idx != TheISA::ZeroReg)
|
||||||
|
#endif
|
||||||
floatRegFile[reg_idx].d = val;
|
floatRegFile[reg_idx].d = val;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -194,7 +196,9 @@ class PhysRegFile
|
||||||
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
|
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
|
||||||
int(reg_idx), (uint64_t)val);
|
int(reg_idx), (uint64_t)val);
|
||||||
|
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
if (reg_idx != TheISA::ZeroReg)
|
if (reg_idx != TheISA::ZeroReg)
|
||||||
|
#endif
|
||||||
floatRegFile[reg_idx].d = val;
|
floatRegFile[reg_idx].d = val;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -356,47 +356,12 @@ DefaultRename<Impl>::squash(const InstSeqNum &squash_seq_num, unsigned tid)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Clear the instruction list and skid buffer in case they have any
|
// Clear the instruction list and skid buffer in case they have any
|
||||||
// insts in them. Since we support multiple ISAs, we cant just:
|
// insts in them.
|
||||||
// "insts[tid].clear();" or "skidBuffer[tid].clear()" since there is
|
|
||||||
// a possible delay slot inst for different architectures
|
|
||||||
// insts[tid].clear();
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
DPRINTF(Rename, "[tid:%i] Squashing incoming decode instructions until "
|
|
||||||
"[sn:%i].\n",tid, squash_seq_num);
|
|
||||||
ListIt ilist_it = insts[tid].begin();
|
|
||||||
while (ilist_it != insts[tid].end()) {
|
|
||||||
if ((*ilist_it)->seqNum > squash_seq_num) {
|
|
||||||
(*ilist_it)->setSquashed();
|
|
||||||
DPRINTF(Rename, "Squashing incoming decode instruction, "
|
|
||||||
"[tid:%i] [sn:%i] PC %08p.\n", tid, (*ilist_it)->seqNum, (*ilist_it)->PC);
|
|
||||||
}
|
|
||||||
ilist_it++;
|
|
||||||
}
|
|
||||||
#else
|
|
||||||
insts[tid].clear();
|
insts[tid].clear();
|
||||||
#endif
|
|
||||||
|
|
||||||
// Clear the skid buffer in case it has any data in it.
|
// Clear the skid buffer in case it has any data in it.
|
||||||
// See comments above.
|
|
||||||
// skidBuffer[tid].clear();
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
|
||||||
DPRINTF(Rename, "[tid:%i] Squashing incoming skidbuffer instructions "
|
|
||||||
"until [sn:%i].\n", tid, squash_seq_num);
|
|
||||||
ListIt slist_it = skidBuffer[tid].begin();
|
|
||||||
while (slist_it != skidBuffer[tid].end()) {
|
|
||||||
if ((*slist_it)->seqNum > squash_seq_num) {
|
|
||||||
(*slist_it)->setSquashed();
|
|
||||||
DPRINTF(Rename, "Squashing skidbuffer instruction, [tid:%i] [sn:%i]"
|
|
||||||
"PC %08p.\n", tid, (*slist_it)->seqNum, (*slist_it)->PC);
|
|
||||||
}
|
|
||||||
slist_it++;
|
|
||||||
}
|
|
||||||
resumeUnblocking = (skidBuffer[tid].size() != 0);
|
|
||||||
DPRINTF(Rename, "Resume unblocking set to %s\n",
|
|
||||||
resumeUnblocking ? "true" : "false");
|
|
||||||
#else
|
|
||||||
skidBuffer[tid].clear();
|
skidBuffer[tid].clear();
|
||||||
#endif
|
|
||||||
doSquash(squash_seq_num, tid);
|
doSquash(squash_seq_num, tid);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -776,10 +741,8 @@ DefaultRename<Impl>::sortInsts()
|
||||||
{
|
{
|
||||||
int insts_from_decode = fromDecode->size;
|
int insts_from_decode = fromDecode->size;
|
||||||
#ifdef DEBUG
|
#ifdef DEBUG
|
||||||
#if !ISA_HAS_DELAY_SLOT
|
|
||||||
for (int i=0; i < numThreads; i++)
|
for (int i=0; i < numThreads; i++)
|
||||||
assert(insts[i].empty());
|
assert(insts[i].empty());
|
||||||
#endif
|
|
||||||
#endif
|
#endif
|
||||||
for (int i = 0; i < insts_from_decode; ++i) {
|
for (int i = 0; i < insts_from_decode; ++i) {
|
||||||
DynInstPtr inst = fromDecode->insts[i];
|
DynInstPtr inst = fromDecode->insts[i];
|
||||||
|
@ -1000,6 +963,7 @@ DefaultRename<Impl>::renameSrcRegs(DynInstPtr &inst,unsigned tid)
|
||||||
// Floating point and Miscellaneous registers need their indexes
|
// Floating point and Miscellaneous registers need their indexes
|
||||||
// adjusted to account for the expanded number of flattened int regs.
|
// adjusted to account for the expanded number of flattened int regs.
|
||||||
flat_src_reg = src_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
|
flat_src_reg = src_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
|
||||||
|
DPRINTF(Rename, "Adjusting reg index from %d to %d.\n", src_reg, flat_src_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
inst->flattenSrcReg(src_idx, flat_src_reg);
|
inst->flattenSrcReg(src_idx, flat_src_reg);
|
||||||
|
@ -1016,9 +980,11 @@ DefaultRename<Impl>::renameSrcRegs(DynInstPtr &inst,unsigned tid)
|
||||||
|
|
||||||
// See if the register is ready or not.
|
// See if the register is ready or not.
|
||||||
if (scoreboard->getReg(renamed_reg) == true) {
|
if (scoreboard->getReg(renamed_reg) == true) {
|
||||||
DPRINTF(Rename, "[tid:%u]: Register is ready.\n", tid);
|
DPRINTF(Rename, "[tid:%u]: Register %d is ready.\n", tid, renamed_reg);
|
||||||
|
|
||||||
inst->markSrcRegReady(src_idx);
|
inst->markSrcRegReady(src_idx);
|
||||||
|
} else {
|
||||||
|
DPRINTF(Rename, "[tid:%u]: Register %d is not ready.\n", tid, renamed_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
++renameRenameLookups;
|
++renameRenameLookups;
|
||||||
|
@ -1045,6 +1011,7 @@ DefaultRename<Impl>::renameDestRegs(DynInstPtr &inst,unsigned tid)
|
||||||
// Floating point and Miscellaneous registers need their indexes
|
// Floating point and Miscellaneous registers need their indexes
|
||||||
// adjusted to account for the expanded number of flattened int regs.
|
// adjusted to account for the expanded number of flattened int regs.
|
||||||
flat_dest_reg = dest_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
|
flat_dest_reg = dest_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
|
||||||
|
DPRINTF(Rename, "Adjusting reg index from %d to %d.\n", dest_reg, flat_dest_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
inst->flattenDestReg(dest_idx, flat_dest_reg);
|
inst->flattenDestReg(dest_idx, flat_dest_reg);
|
||||||
|
@ -1248,13 +1215,7 @@ DefaultRename<Impl>::checkSignalsAndUpdate(unsigned tid)
|
||||||
DPRINTF(Rename, "[tid:%u]: Squashing instructions due to squash from "
|
DPRINTF(Rename, "[tid:%u]: Squashing instructions due to squash from "
|
||||||
"commit.\n", tid);
|
"commit.\n", tid);
|
||||||
|
|
||||||
#if ISA_HAS_DELAY_SLOT
|
squash(fromCommit->commitInfo[tid].doneSeqNum, tid);
|
||||||
InstSeqNum squashed_seq_num = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
|
|
||||||
#else
|
|
||||||
InstSeqNum squashed_seq_num = fromCommit->commitInfo[tid].doneSeqNum;
|
|
||||||
#endif
|
|
||||||
|
|
||||||
squash(squashed_seq_num, tid);
|
|
||||||
|
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
|
@ -165,17 +165,21 @@ SimpleRenameMap::rename(RegIndex arch_reg)
|
||||||
|
|
||||||
// If it's not referencing the zero register, then rename the
|
// If it's not referencing the zero register, then rename the
|
||||||
// register.
|
// register.
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
if (arch_reg != floatZeroReg) {
|
if (arch_reg != floatZeroReg) {
|
||||||
|
#endif
|
||||||
renamed_reg = freeList->getFloatReg();
|
renamed_reg = freeList->getFloatReg();
|
||||||
|
|
||||||
floatRenameMap[arch_reg].physical_reg = renamed_reg;
|
floatRenameMap[arch_reg].physical_reg = renamed_reg;
|
||||||
|
|
||||||
assert(renamed_reg < numPhysicalRegs &&
|
assert(renamed_reg < numPhysicalRegs &&
|
||||||
renamed_reg >= numPhysicalIntRegs);
|
renamed_reg >= numPhysicalIntRegs);
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
} else {
|
} else {
|
||||||
// Otherwise return the zero register so nothing bad happens.
|
// Otherwise return the zero register so nothing bad happens.
|
||||||
renamed_reg = floatZeroReg;
|
renamed_reg = floatZeroReg;
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
} else {
|
} else {
|
||||||
// Subtract off the base offset for miscellaneous registers.
|
// Subtract off the base offset for miscellaneous registers.
|
||||||
arch_reg = arch_reg - numLogicalRegs;
|
arch_reg = arch_reg - numLogicalRegs;
|
||||||
|
|
|
@ -29,6 +29,7 @@
|
||||||
* Kevin Lim
|
* Kevin Lim
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
#include "arch/isa_specific.hh"
|
||||||
#include "cpu/o3/scoreboard.hh"
|
#include "cpu/o3/scoreboard.hh"
|
||||||
|
|
||||||
Scoreboard::Scoreboard(unsigned activeThreads,
|
Scoreboard::Scoreboard(unsigned activeThreads,
|
||||||
|
@ -79,11 +80,18 @@ Scoreboard::name() const
|
||||||
bool
|
bool
|
||||||
Scoreboard::getReg(PhysRegIndex phys_reg)
|
Scoreboard::getReg(PhysRegIndex phys_reg)
|
||||||
{
|
{
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
// Always ready if int or fp zero reg.
|
// Always ready if int or fp zero reg.
|
||||||
if (phys_reg == zeroRegIdx ||
|
if (phys_reg == zeroRegIdx ||
|
||||||
phys_reg == (zeroRegIdx + numPhysicalIntRegs)) {
|
phys_reg == (zeroRegIdx + numPhysicalIntRegs)) {
|
||||||
return 1;
|
return 1;
|
||||||
}
|
}
|
||||||
|
#else
|
||||||
|
// Always ready if int zero reg.
|
||||||
|
if (phys_reg == zeroRegIdx) {
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
return regScoreBoard[phys_reg];
|
return regScoreBoard[phys_reg];
|
||||||
}
|
}
|
||||||
|
@ -99,11 +107,18 @@ Scoreboard::setReg(PhysRegIndex phys_reg)
|
||||||
void
|
void
|
||||||
Scoreboard::unsetReg(PhysRegIndex ready_reg)
|
Scoreboard::unsetReg(PhysRegIndex ready_reg)
|
||||||
{
|
{
|
||||||
|
#if THE_ISA == ALPHA_ISA
|
||||||
if (ready_reg == zeroRegIdx ||
|
if (ready_reg == zeroRegIdx ||
|
||||||
ready_reg == (zeroRegIdx + numPhysicalIntRegs)) {
|
ready_reg == (zeroRegIdx + numPhysicalIntRegs)) {
|
||||||
// Don't do anything if int or fp zero reg.
|
// Don't do anything if int or fp zero reg.
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
#else
|
||||||
|
if (ready_reg == zeroRegIdx) {
|
||||||
|
// Don't do anything if int zero reg.
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
regScoreBoard[ready_reg] = 0;
|
regScoreBoard[ready_reg] = 0;
|
||||||
}
|
}
|
||||||
|
|
|
@ -56,8 +56,14 @@ class SparcDynInst : public BaseDynInst<Impl>
|
||||||
|
|
||||||
public:
|
public:
|
||||||
/** BaseDynInst constructor given a binary instruction. */
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
SparcDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC,
|
SparcDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
|
||||||
Addr Pred_PC, Addr Pred_NPC, InstSeqNum seq_num, O3CPU *cpu);
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
|
/** BaseDynInst constructor given a binary instruction. */
|
||||||
|
SparcDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu);
|
||||||
|
|
||||||
/** BaseDynInst constructor given a static inst pointer. */
|
/** BaseDynInst constructor given a static inst pointer. */
|
||||||
SparcDynInst(StaticInstPtr &_staticInst);
|
SparcDynInst(StaticInstPtr &_staticInst);
|
||||||
|
|
|
@ -31,10 +31,23 @@
|
||||||
#include "cpu/o3/sparc/dyn_inst.hh"
|
#include "cpu/o3/sparc/dyn_inst.hh"
|
||||||
|
|
||||||
template <class Impl>
|
template <class Impl>
|
||||||
SparcDynInst<Impl>::SparcDynInst(TheISA::ExtMachInst inst,
|
SparcDynInst<Impl>::SparcDynInst(StaticInstPtr staticInst,
|
||||||
Addr PC, Addr NPC, Addr Pred_PC, Addr Pred_NPC,
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
InstSeqNum seq_num, O3CPU *cpu)
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
|
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
|
{
|
||||||
|
initVars();
|
||||||
|
}
|
||||||
|
|
||||||
|
template <class Impl>
|
||||||
|
SparcDynInst<Impl>::SparcDynInst(TheISA::ExtMachInst inst,
|
||||||
|
Addr PC, Addr NPC, Addr microPC,
|
||||||
|
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
|
||||||
|
InstSeqNum seq_num, O3CPU *cpu)
|
||||||
|
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
|
||||||
|
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
|
||||||
{
|
{
|
||||||
initVars();
|
initVars();
|
||||||
}
|
}
|
||||||
|
|
|
@ -29,5 +29,5 @@
|
||||||
m5.AddToPath('../configs/common')
|
m5.AddToPath('../configs/common')
|
||||||
from cpu2000 import mcf
|
from cpu2000 import mcf
|
||||||
|
|
||||||
workload = mcf(isa, opsys, 'lgred')
|
workload = mcf(isa, opsys, 'smred')
|
||||||
root.system.cpu.workload = workload.makeLiveProcess()
|
root.system.cpu.workload = workload.makeLiveProcess()
|
||||||
|
|
Loading…
Reference in a new issue