Merge vm1.(none):/home/stever/bk/newmem-head

into  vm1.(none):/home/stever/bk/newmem-cache2

--HG--
extra : convert_revision : aa50af3094f5d459f75b514179b6e3ec5e0bf1df
This commit is contained in:
Steve Reinhardt 2007-06-22 16:13:53 -07:00
commit ed1db23b41
68 changed files with 4383 additions and 7289 deletions

View file

@ -57,10 +57,12 @@ let {{
addrCalcImm = 'EA = Rs1 + imm;'
iop = InstObjParams(name, Name, 'Mem',
{"code": code, "postacc_code" : postacc_code,
"fault_check": faultCode, "ea_code": addrCalcReg}, opt_flags)
"fault_check": faultCode, "ea_code": addrCalcReg,
"EA_trunc": TruncateEA}, opt_flags)
iop_imm = InstObjParams(name, Name + "Imm", 'MemImm',
{"code": code, "postacc_code" : postacc_code,
"fault_check": faultCode, "ea_code": addrCalcImm}, opt_flags)
"fault_check": faultCode, "ea_code": addrCalcImm,
"EA_trunc": TruncateEA}, opt_flags)
header_output = MemDeclare.subst(iop) + MemDeclare.subst(iop_imm)
decoder_output = BasicConstructor.subst(iop) + BasicConstructor.subst(iop_imm)
decode_block = ROrImmDecode.subst(iop)

View file

@ -298,11 +298,13 @@ let {{
iop = InstObjParams(name, Name, 'BlockMem',
{"code": pcedCode, "ea_code": addrCalcReg,
"fault_check": faultCode, "micro_pc": microPc,
"set_flags": flag_code}, opt_flags)
"set_flags": flag_code, "EA_trunc" : TruncateEA},
opt_flags)
iop_imm = InstObjParams(name, Name + 'Imm', 'BlockMemImm',
{"code": pcedCode, "ea_code": addrCalcImm,
"fault_check": faultCode, "micro_pc": microPc,
"set_flags": flag_code}, opt_flags)
"set_flags": flag_code, "EA_trunc" : TruncateEA},
opt_flags)
decoder_output += BlockMemMicroConstructor.subst(iop)
decoder_output += BlockMemMicroConstructor.subst(iop_imm)
exec_output += doDualSplitExecute(

View file

@ -51,6 +51,7 @@ def template SwapExecute {{
}
if(storeCond && fault == NoFault)
{
%(EA_trunc)s
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
EA, %(asi_val)s, &mem_data);
}
@ -91,6 +92,7 @@ def template SwapInitiateAcc {{
}
if(fault == NoFault)
{
%(EA_trunc)s
fault = xc->write((uint%(mem_acc_size)s_t)Mem,
EA, %(asi_val)s, &mem_data);
}
@ -157,12 +159,14 @@ let {{
addrCalcReg = 'EA = Rs1;'
iop = InstObjParams(name, Name, 'Mem',
{"code": code, "postacc_code" : postacc_code,
"fault_check": faultCode, "ea_code": addrCalcReg}, opt_flags)
"fault_check": faultCode, "ea_code": addrCalcReg,
"EA_trunc" : TruncateEA}, opt_flags)
header_output = MemDeclare.subst(iop)
decoder_output = BasicConstructor.subst(iop)
decode_block = BasicDecode.subst(iop)
microParams = {"code": code, "postacc_code" : postacc_code,
"ea_code" : addrCalcReg, "fault_check" : faultCode}
"ea_code" : addrCalcReg, "fault_check" : faultCode,
"EA_trunc" : TruncateEA}
exec_output = doSplitExecute(execute, name, Name, asi,
["IsStoreConditional"], microParams);
return (header_output, decoder_output, exec_output, decode_block)

View file

@ -149,6 +149,7 @@ def template LoadExecute {{
%(fault_check)s;
if(fault == NoFault)
{
%(EA_trunc)s
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
}
if(fault == NoFault)
@ -179,6 +180,7 @@ def template LoadInitiateAcc {{
%(fault_check)s;
if(fault == NoFault)
{
%(EA_trunc)s
fault = xc->read(EA, (%(mem_acc_type)s%(mem_acc_size)s_t&)Mem, %(asi_val)s);
}
return fault;
@ -224,6 +226,7 @@ def template StoreExecute {{
}
if(storeCond && fault == NoFault)
{
%(EA_trunc)s
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
EA, %(asi_val)s, 0);
}
@ -257,6 +260,7 @@ def template StoreInitiateAcc {{
}
if(storeCond && fault == NoFault)
{
%(EA_trunc)s
fault = xc->write((%(mem_acc_type)s%(mem_acc_size)s_t)Mem,
EA, %(asi_val)s, 0);
}
@ -317,6 +321,11 @@ let {{
fault = new PrivilegedAction;
'''
TruncateEA = '''
#if !FULL_SYSTEM
EA = Pstate<3:> ? EA<31:0> : EA;
#endif
'''
}};
//A simple function to generate the name of the macro op of a certain
@ -346,7 +355,8 @@ let {{
(eaRegCode, nameReg, NameReg),
(eaImmCode, nameImm, NameImm)):
microParams = {"code": code, "postacc_code" : postacc_code,
"ea_code": eaCode, "fault_check": faultCode}
"ea_code": eaCode, "fault_check": faultCode,
"EA_trunc" : TruncateEA}
executeCode += doSplitExecute(execute, name, Name,
asi, opt_flags, microParams)
return executeCode

View file

@ -149,7 +149,8 @@ def operands {{
'Fprs': ('ControlReg', 'udw', 'MISCREG_FPRS', None, 43),
'Pcr': ('ControlReg', 'udw', 'MISCREG_PCR', None, 44),
'Pic': ('ControlReg', 'udw', 'MISCREG_PIC', None, 45),
'Gsr': ('ControlReg', 'udw', 'MISCREG_GSR', None, 46),
# 'Gsr': ('ControlReg', 'udw', 'MISCREG_GSR', (None, None, ['IsSerializeAfter','IsSerializing','IsNonSpeculative']), 46),
'Gsr': ('IntReg', 'udw', 'NumIntArchRegs + 8', None, 46),
'Softint': ('ControlReg', 'udw', 'MISCREG_SOFTINT', None, 47),
'SoftintSet': ('ControlReg', 'udw', 'MISCREG_SOFTINT_SET', None, 48),
'SoftintClr': ('ControlReg', 'udw', 'MISCREG_SOFTINT_CLR', None, 49),
@ -187,7 +188,7 @@ def operands {{
'Hver': ('ControlReg', 'udw', 'MISCREG_HVER', None, 74),
'StrandStsReg': ('ControlReg', 'udw', 'MISCREG_STRAND_STS_REG', None, 75),
'Fsr': ('ControlReg', 'udw', 'MISCREG_FSR', None, 80),
'Fsr': ('ControlReg', 'udw', 'MISCREG_FSR', (None, None, ['IsSerializeAfter','IsSerializing','IsNonSpeculative']), 80),
# Mem gets a large number so it's always last
'Mem': ('Mem', 'udw', None, ('IsMemRef', 'IsLoad', 'IsStore'), 100)

View file

@ -58,7 +58,7 @@ namespace SparcISA
// These enumerate all the registers for dependence tracking.
enum DependenceTags {
FP_Base_DepTag = 32*3+8,
FP_Base_DepTag = 32*3+9,
Ctrl_Base_DepTag = FP_Base_DepTag + 64
};

View file

@ -88,8 +88,8 @@ Sparc32LiveProcess::startup()
//From the SPARC ABI
//The process runs in user mode
threadContexts[0]->setMiscReg(MISCREG_PSTATE, 0x02);
//The process runs in user mode with 32 bit addresses
threadContexts[0]->setMiscReg(MISCREG_PSTATE, 0x0a);
//Setup default FP state
threadContexts[0]->setMiscRegNoEffect(MISCREG_FSR, 0);

View file

@ -42,7 +42,7 @@ namespace SparcISA
// Number of register windows, can legally be 3 to 32
const int NWindows = 8;
//const int NumMicroIntRegs = 1;
const int NumMicroIntRegs = 8;
const int NumMicroIntRegs = 9;
// const int NumRegularIntRegs = MaxGL * 8 + NWindows * 16;
// const int NumMicroIntRegs = 1;

View file

@ -59,7 +59,7 @@ namespace SparcISA
typedef int RegContextVal;
typedef uint8_t RegIndex;
typedef uint16_t RegIndex;
}
#endif

View file

@ -103,7 +103,6 @@ output header {{
#include "base/misc.hh"
#include "cpu/static_inst.hh"
#include "mem/packet.hh"
#include "mem/request.hh" // some constructors use MemReq flags
#include "sim/faults.hh"
}};

View file

@ -61,8 +61,8 @@ def macroop CALL_I
limm t2, imm
rdip t1
subi "INTREG_RSP", "INTREG_RSP", dsz
st t1, ss, [0, t0, "INTREG_RSP"]
subi rsp, rsp, dsz
st t1, ss, [0, t0, rsp]
wrip t1, t2
};
'''

View file

@ -58,16 +58,16 @@ def macroop POP_R {
# Make the default data size of pops 64 bits in 64 bit mode
.adjust_env oszIn64Override
ld reg, ss, [0, t0, "INTREG_RSP"]
addi "INTREG_RSP", "INTREG_RSP", dsz
ld reg, ss, [0, t0, rsp]
addi rsp, rsp, dsz
};
def macroop PUSH_R {
# Make the default data size of pops 64 bits in 64 bit mode
.adjust_env oszIn64Override
subi "INTREG_RSP", "INTREG_RSP", dsz
st reg, ss, [0, t0, "INTREG_RSP"]
subi rsp, rsp, dsz
st reg, ss, [0, t0, rsp]
};
'''
#let {{

View file

@ -91,6 +91,9 @@ let {{
"osz" : "env.operandSize",
"ssz" : "env.stackSize"
}
for reg in ('ax', 'bx', 'cx', 'dx', 'sp', 'bp', 'si', 'di'):
assembler.symbols["r%s" % reg] = "INTREG_R%s" % reg.upper()
assembler.symbols.update(symbols)
# Code literal which forces a default 64 bit operand size in 64 bit mode.

View file

@ -209,6 +209,9 @@ class BaseDynInst : public FastAlloc, public RefCounted
/** PC of this instruction. */
Addr PC;
/** Micro PC of this instruction. */
Addr microPC;
protected:
/** Next non-speculative PC. It is not filled in at fetch, but rather
* once the target of the branch is truly known (either decode or
@ -219,12 +222,18 @@ class BaseDynInst : public FastAlloc, public RefCounted
/** Next non-speculative NPC. Target PC for Mips or Sparc. */
Addr nextNPC;
/** Next non-speculative micro PC. */
Addr nextMicroPC;
/** Predicted next PC. */
Addr predPC;
/** Predicted next NPC. */
Addr predNPC;
/** Predicted next microPC */
Addr predMicroPC;
/** If this is a branch that was predicted taken */
bool predTaken;
@ -340,6 +349,17 @@ class BaseDynInst : public FastAlloc, public RefCounted
{
_flatDestRegIdx[idx] = flattened_dest;
}
/** BaseDynInst constructor given a binary instruction.
* @param staticInst A StaticInstPtr to the underlying instruction.
* @param PC The PC of the instruction.
* @param pred_PC The predicted next PC.
* @param pred_NPC The predicted next NPC.
* @param seq_num The sequence number of the instruction.
* @param cpu Pointer to the instruction's CPU.
*/
BaseDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
Addr pred_PC, Addr pred_NPC, Addr pred_MicroPC,
InstSeqNum seq_num, ImplCPU *cpu);
/** BaseDynInst constructor given a binary instruction.
* @param inst The binary instruction.
@ -349,8 +369,8 @@ class BaseDynInst : public FastAlloc, public RefCounted
* @param seq_num The sequence number of the instruction.
* @param cpu Pointer to the instruction's CPU.
*/
BaseDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC,
Addr pred_PC, Addr pred_NPC,
BaseDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
Addr pred_PC, Addr pred_NPC, Addr pred_MicroPC,
InstSeqNum seq_num, ImplCPU *cpu);
/** BaseDynInst constructor given a StaticInst pointer.
@ -402,11 +422,18 @@ class BaseDynInst : public FastAlloc, public RefCounted
#endif
}
Addr readNextMicroPC()
{
return nextMicroPC;
}
/** Set the predicted target of this current instruction. */
void setPredTarg(Addr predicted_PC, Addr predicted_NPC)
void setPredTarg(Addr predicted_PC, Addr predicted_NPC,
Addr predicted_MicroPC)
{
predPC = predicted_PC;
predNPC = predicted_NPC;
predMicroPC = predicted_MicroPC;
}
/** Returns the predicted PC immediately after the branch. */
@ -415,6 +442,9 @@ class BaseDynInst : public FastAlloc, public RefCounted
/** Returns the predicted PC two instructions after the branch */
Addr readPredNPC() { return predNPC; }
/** Returns the predicted micro PC after the branch */
Addr readPredMicroPC() { return predMicroPC; }
/** Returns whether the instruction was predicted taken or not. */
bool readPredTaken()
{
@ -430,7 +460,8 @@ class BaseDynInst : public FastAlloc, public RefCounted
bool mispredicted()
{
return readPredPC() != readNextPC() ||
readPredNPC() != readNextNPC();
readPredNPC() != readNextNPC() ||
readPredMicroPC() != readNextMicroPC();
}
//
@ -467,6 +498,12 @@ class BaseDynInst : public FastAlloc, public RefCounted
bool isQuiesce() const { return staticInst->isQuiesce(); }
bool isIprAccess() const { return staticInst->isIprAccess(); }
bool isUnverifiable() const { return staticInst->isUnverifiable(); }
bool isMacroop() const { return staticInst->isMacroop(); }
bool isMicroop() const { return staticInst->isMicroop(); }
bool isDelayedCommit() const { return staticInst->isDelayedCommit(); }
bool isLastMicroop() const { return staticInst->isLastMicroop(); }
bool isFirstMicroop() const { return staticInst->isFirstMicroop(); }
bool isMicroBranch() const { return staticInst->isMicroBranch(); }
/** Temporarily sets this instruction as a serialize before instruction. */
void setSerializeBefore() { status.set(SerializeBefore); }
@ -700,16 +737,26 @@ class BaseDynInst : public FastAlloc, public RefCounted
/** Read the PC of this instruction. */
const Addr readPC() const { return PC; }
/**Read the micro PC of this instruction. */
const Addr readMicroPC() const { return microPC; }
/** Set the next PC of this instruction (its actual target). */
void setNextPC(uint64_t val)
void setNextPC(Addr val)
{
nextPC = val;
}
/** Set the next NPC of this instruction (the target in Mips or Sparc).*/
void setNextNPC(uint64_t val)
void setNextNPC(Addr val)
{
#if ISA_HAS_DELAY_SLOT
nextNPC = val;
#endif
}
void setNextMicroPC(Addr val)
{
nextMicroPC = val;
}
/** Sets the ASID. */

View file

@ -62,19 +62,66 @@ my_hash_t thishash;
#endif
template <class Impl>
BaseDynInst<Impl>::BaseDynInst(TheISA::ExtMachInst machInst,
BaseDynInst<Impl>::BaseDynInst(StaticInstPtr _staticInst,
Addr inst_PC, Addr inst_NPC,
Addr inst_MicroPC,
Addr pred_PC, Addr pred_NPC,
Addr pred_MicroPC,
InstSeqNum seq_num, ImplCPU *cpu)
: staticInst(machInst, inst_PC), traceData(NULL), cpu(cpu)
: staticInst(_staticInst), traceData(NULL), cpu(cpu)
{
seqNum = seq_num;
bool nextIsMicro =
staticInst->isMicroop() && !staticInst->isLastMicroop();
PC = inst_PC;
nextPC = inst_NPC;
nextNPC = nextPC + sizeof(TheISA::MachInst);
microPC = inst_MicroPC;
if (nextIsMicro) {
nextPC = inst_PC;
nextNPC = inst_NPC;
nextMicroPC = microPC + 1;
} else {
nextPC = inst_NPC;
nextNPC = nextPC + sizeof(TheISA::MachInst);
nextMicroPC = 0;
}
predPC = pred_PC;
predNPC = pred_NPC;
predMicroPC = pred_MicroPC;
predTaken = false;
initVars();
}
template <class Impl>
BaseDynInst<Impl>::BaseDynInst(TheISA::ExtMachInst inst,
Addr inst_PC, Addr inst_NPC,
Addr inst_MicroPC,
Addr pred_PC, Addr pred_NPC,
Addr pred_MicroPC,
InstSeqNum seq_num, ImplCPU *cpu)
: staticInst(inst, inst_PC), traceData(NULL), cpu(cpu)
{
seqNum = seq_num;
bool nextIsMicro =
staticInst->isMicroop() && !staticInst->isLastMicroop();
PC = inst_PC;
microPC = inst_MicroPC;
if (nextIsMicro) {
nextPC = inst_PC;
nextNPC = inst_NPC;
nextMicroPC = microPC + 1;
} else {
nextPC = inst_NPC;
nextNPC = nextPC + sizeof(TheISA::MachInst);
nextMicroPC = 0;
}
predPC = pred_PC;
predNPC = pred_NPC;
predMicroPC = pred_MicroPC;
predTaken = false;
initVars();

View file

@ -73,8 +73,13 @@ class AlphaDynInst : public BaseDynInst<Impl>
public:
/** BaseDynInst constructor given a binary instruction. */
AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC,
Addr Pred_PC, Addr Pred_NPC,
AlphaDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a binary instruction. */
AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a static inst pointer. */

View file

@ -31,10 +31,25 @@
#include "cpu/o3/alpha/dyn_inst.hh"
template <class Impl>
AlphaDynInst<Impl>::AlphaDynInst(ExtMachInst inst, Addr PC, Addr NPC,
AlphaDynInst<Impl>::AlphaDynInst(StaticInstPtr staticInst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC,
Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}
template <class Impl>
AlphaDynInst<Impl>::AlphaDynInst(ExtMachInst inst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC,
Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}

View file

@ -87,10 +87,10 @@ struct DefaultIEWDefaultCommit {
bool squash[Impl::MaxThreads];
bool branchMispredict[Impl::MaxThreads];
bool branchTaken[Impl::MaxThreads];
bool squashDelaySlot[Impl::MaxThreads];
uint64_t mispredPC[Impl::MaxThreads];
uint64_t nextPC[Impl::MaxThreads];
uint64_t nextNPC[Impl::MaxThreads];
Addr mispredPC[Impl::MaxThreads];
Addr nextPC[Impl::MaxThreads];
Addr nextNPC[Impl::MaxThreads];
Addr nextMicroPC[Impl::MaxThreads];
InstSeqNum squashedSeqNum[Impl::MaxThreads];
bool includeSquashInst[Impl::MaxThreads];
@ -114,15 +114,15 @@ struct TimeBufStruct {
uint64_t branchAddr;
InstSeqNum doneSeqNum;
InstSeqNum bdelayDoneSeqNum;
// @todo: Might want to package this kind of branch stuff into a single
// struct as it is used pretty frequently.
bool branchMispredict;
bool branchTaken;
uint64_t mispredPC;
uint64_t nextPC;
uint64_t nextNPC;
Addr mispredPC;
Addr nextPC;
Addr nextNPC;
Addr nextMicroPC;
unsigned branchCount;
};
@ -160,18 +160,16 @@ struct TimeBufStruct {
bool branchMispredict;
bool branchTaken;
uint64_t mispredPC;
uint64_t nextPC;
uint64_t nextNPC;
Addr mispredPC;
Addr nextPC;
Addr nextNPC;
Addr nextMicroPC;
// Represents the instruction that has either been retired or
// squashed. Similar to having a single bus that broadcasts the
// retired or squashed sequence number.
InstSeqNum doneSeqNum;
InstSeqNum bdelayDoneSeqNum;
bool squashDelaySlot;
//Just in case we want to do a commit/squash on a cycle
//(necessary for multiple ROBs?)
bool commitInsts;

View file

@ -279,25 +279,37 @@ class DefaultCommit
/** Returns the PC of the head instruction of the ROB.
* @todo: Probably remove this function as it returns only thread 0.
*/
uint64_t readPC() { return PC[0]; }
Addr readPC() { return PC[0]; }
/** Returns the PC of a specific thread. */
uint64_t readPC(unsigned tid) { return PC[tid]; }
Addr readPC(unsigned tid) { return PC[tid]; }
/** Sets the PC of a specific thread. */
void setPC(uint64_t val, unsigned tid) { PC[tid] = val; }
void setPC(Addr val, unsigned tid) { PC[tid] = val; }
/** Reads the micro PC of a specific thread. */
Addr readMicroPC(unsigned tid) { return microPC[tid]; }
/** Sets the micro PC of a specific thread */
void setMicroPC(Addr val, unsigned tid) { microPC[tid] = val; }
/** Reads the next PC of a specific thread. */
uint64_t readNextPC(unsigned tid) { return nextPC[tid]; }
Addr readNextPC(unsigned tid) { return nextPC[tid]; }
/** Sets the next PC of a specific thread. */
void setNextPC(uint64_t val, unsigned tid) { nextPC[tid] = val; }
void setNextPC(Addr val, unsigned tid) { nextPC[tid] = val; }
/** Reads the next NPC of a specific thread. */
uint64_t readNextNPC(unsigned tid) { return nextNPC[tid]; }
Addr readNextNPC(unsigned tid) { return nextNPC[tid]; }
/** Sets the next NPC of a specific thread. */
void setNextNPC(uint64_t val, unsigned tid) { nextNPC[tid] = val; }
void setNextNPC(Addr val, unsigned tid) { nextNPC[tid] = val; }
/** Reads the micro PC of a specific thread. */
Addr readNextMicroPC(unsigned tid) { return nextMicroPC[tid]; }
/** Sets the micro PC of a specific thread */
void setNextMicroPC(Addr val, unsigned tid) { nextMicroPC[tid] = val; }
private:
/** Time buffer interface. */
@ -402,12 +414,20 @@ class DefaultCommit
*/
Addr PC[Impl::MaxThreads];
/** The commit micro PC of each thread. Refers to the instruction that
* is currently being processed/committed.
*/
Addr microPC[Impl::MaxThreads];
/** The next PC of each thread. */
Addr nextPC[Impl::MaxThreads];
/** The next NPC of each thread. */
Addr nextNPC[Impl::MaxThreads];
/** The next micro PC of each thread. */
Addr nextMicroPC[Impl::MaxThreads];
/** The sequence number of the youngest valid instruction in the ROB. */
InstSeqNum youngestSeqNum[Impl::MaxThreads];

View file

@ -124,7 +124,7 @@ DefaultCommit<Impl>::DefaultCommit(O3CPU *_cpu, Params *params)
committedStores[i] = false;
trapSquash[i] = false;
tcSquash[i] = false;
PC[i] = nextPC[i] = nextNPC[i] = 0;
microPC[i] = nextMicroPC[i] = PC[i] = nextPC[i] = nextNPC[i] = 0;
}
#if FULL_SYSTEM
interrupt = NoFault;
@ -508,6 +508,7 @@ DefaultCommit<Impl>::squashAll(unsigned tid)
toIEW->commitInfo[tid].nextPC = PC[tid];
toIEW->commitInfo[tid].nextNPC = nextPC[tid];
toIEW->commitInfo[tid].nextMicroPC = nextMicroPC[tid];
}
template <class Impl>
@ -738,38 +739,15 @@ DefaultCommit<Impl>::commit()
// then use one older sequence number.
InstSeqNum squashed_inst = fromIEW->squashedSeqNum[tid];
#if ISA_HAS_DELAY_SLOT
InstSeqNum bdelay_done_seq_num = squashed_inst;
bool squash_bdelay_slot = fromIEW->squashDelaySlot[tid];
bool branchMispredict = fromIEW->branchMispredict[tid];
// Squashing/not squashing the branch delay slot only makes
// sense when you're squashing from a branch, ie from a branch
// mispredict.
if (branchMispredict && !squash_bdelay_slot) {
bdelay_done_seq_num++;
}
#endif
if (fromIEW->includeSquashInst[tid] == true) {
squashed_inst--;
#if ISA_HAS_DELAY_SLOT
bdelay_done_seq_num--;
#endif
}
// All younger instructions will be squashed. Set the sequence
// number as the youngest instruction in the ROB.
youngestSeqNum[tid] = squashed_inst;
#if ISA_HAS_DELAY_SLOT
rob->squash(bdelay_done_seq_num, tid);
toIEW->commitInfo[tid].squashDelaySlot = squash_bdelay_slot;
toIEW->commitInfo[tid].bdelayDoneSeqNum = bdelay_done_seq_num;
#else
rob->squash(squashed_inst, tid);
toIEW->commitInfo[tid].squashDelaySlot = true;
#endif
changedROBNumEntries[tid] = true;
toIEW->commitInfo[tid].doneSeqNum = squashed_inst;
@ -788,6 +766,7 @@ DefaultCommit<Impl>::commit()
toIEW->commitInfo[tid].nextPC = fromIEW->nextPC[tid];
toIEW->commitInfo[tid].nextNPC = fromIEW->nextNPC[tid];
toIEW->commitInfo[tid].nextMicroPC = fromIEW->nextMicroPC[tid];
toIEW->commitInfo[tid].mispredPC = fromIEW->mispredPC[tid];
@ -806,10 +785,6 @@ DefaultCommit<Impl>::commit()
// Try to commit any instructions.
commitInsts();
} else {
#if ISA_HAS_DELAY_SLOT
skidInsert();
#endif
}
//Check for any activity
@ -901,6 +876,7 @@ DefaultCommit<Impl>::commitInsts()
PC[tid] = head_inst->readPC();
nextPC[tid] = head_inst->readNextPC();
nextNPC[tid] = head_inst->readNextNPC();
nextMicroPC[tid] = head_inst->readNextMicroPC();
// Increment the total number of non-speculative instructions
// executed.
@ -929,12 +905,10 @@ DefaultCommit<Impl>::commitInsts()
}
PC[tid] = nextPC[tid];
#if ISA_HAS_DELAY_SLOT
nextPC[tid] = nextNPC[tid];
nextNPC[tid] = nextNPC[tid] + sizeof(TheISA::MachInst);
#else
nextPC[tid] = nextPC[tid] + sizeof(TheISA::MachInst);
#endif
microPC[tid] = nextMicroPC[tid];
nextMicroPC[tid] = microPC[tid] + 1;
#if FULL_SYSTEM
int count = 0;
@ -1161,37 +1135,13 @@ DefaultCommit<Impl>::getInsts()
{
DPRINTF(Commit, "Getting instructions from Rename stage.\n");
#if ISA_HAS_DELAY_SLOT
// Read any renamed instructions and place them into the ROB.
int insts_to_process = std::min((int)renameWidth,
(int)(fromRename->size + skidBuffer.size()));
int rename_idx = 0;
DPRINTF(Commit, "%i insts available to process. Rename Insts:%i "
"SkidBuffer Insts:%i\n", insts_to_process, fromRename->size,
skidBuffer.size());
#else
// Read any renamed instructions and place them into the ROB.
int insts_to_process = std::min((int)renameWidth, fromRename->size);
#endif
for (int inst_num = 0; inst_num < insts_to_process; ++inst_num) {
DynInstPtr inst;
#if ISA_HAS_DELAY_SLOT
// Get insts from skidBuffer or from Rename
if (skidBuffer.size() > 0) {
DPRINTF(Commit, "Grabbing skidbuffer inst.\n");
inst = skidBuffer.front();
skidBuffer.pop();
} else {
DPRINTF(Commit, "Grabbing rename inst.\n");
inst = fromRename->insts[rename_idx++];
}
#else
inst = fromRename->insts[inst_num];
#endif
int tid = inst->threadNumber;
if (!inst->isSquashed() &&
@ -1213,30 +1163,6 @@ DefaultCommit<Impl>::getInsts()
inst->readPC(), inst->seqNum, tid);
}
}
#if ISA_HAS_DELAY_SLOT
if (rename_idx < fromRename->size) {
DPRINTF(Commit,"Placing Rename Insts into skidBuffer.\n");
for (;
rename_idx < fromRename->size;
rename_idx++) {
DynInstPtr inst = fromRename->insts[rename_idx];
if (!inst->isSquashed()) {
DPRINTF(Commit, "Inserting PC %#x [sn:%i] [tid:%i] into ",
"skidBuffer.\n", inst->readPC(), inst->seqNum,
inst->threadNumber);
skidBuffer.push(inst);
} else {
DPRINTF(Commit, "Instruction PC %#x [sn:%i] [tid:%i] was "
"squashed, skipping.\n",
inst->readPC(), inst->seqNum, inst->threadNumber);
}
}
}
#endif
}
template <class Impl>

View file

@ -694,7 +694,7 @@ FullO3CPU<Impl>::removeThread(unsigned tid)
// Squash Throughout Pipeline
InstSeqNum squash_seq_num = commit.rob->readHeadInst(tid)->seqNum;
fetch.squash(0, sizeof(TheISA::MachInst), squash_seq_num, true, tid);
fetch.squash(0, sizeof(TheISA::MachInst), 0, squash_seq_num, tid);
decode.squash(tid);
rename.squash(squash_seq_num, tid);
iew.squash(tid);
@ -1148,6 +1148,20 @@ FullO3CPU<Impl>::setPC(Addr new_PC,unsigned tid)
commit.setPC(new_PC, tid);
}
template <class Impl>
uint64_t
FullO3CPU<Impl>::readMicroPC(unsigned tid)
{
return commit.readMicroPC(tid);
}
template <class Impl>
void
FullO3CPU<Impl>::setMicroPC(Addr new_PC,unsigned tid)
{
commit.setMicroPC(new_PC, tid);
}
template <class Impl>
uint64_t
FullO3CPU<Impl>::readNextPC(unsigned tid)
@ -1176,6 +1190,20 @@ FullO3CPU<Impl>::setNextNPC(uint64_t val,unsigned tid)
commit.setNextNPC(val, tid);
}
template <class Impl>
uint64_t
FullO3CPU<Impl>::readNextMicroPC(unsigned tid)
{
return commit.readNextMicroPC(tid);
}
template <class Impl>
void
FullO3CPU<Impl>::setNextMicroPC(Addr new_PC,unsigned tid)
{
commit.setNextMicroPC(new_PC, tid);
}
template <class Impl>
typename FullO3CPU<Impl>::ListIt
FullO3CPU<Impl>::addInst(DynInstPtr &inst)
@ -1224,9 +1252,7 @@ FullO3CPU<Impl>::removeFrontInst(DynInstPtr &inst)
template <class Impl>
void
FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid,
bool squash_delay_slot,
const InstSeqNum &delay_slot_seq_num)
FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid)
{
DPRINTF(O3CPU, "Thread %i: Deleting instructions from instruction"
" list.\n", tid);
@ -1257,12 +1283,6 @@ FullO3CPU<Impl>::removeInstsNotInROB(unsigned tid,
while (inst_it != end_it) {
assert(!instList.empty());
#if ISA_HAS_DELAY_SLOT
if(!squash_delay_slot &&
delay_slot_seq_num >= (*inst_it)->seqNum) {
break;
}
#endif
squashInstIt(inst_it, tid);
inst_it--;

View file

@ -434,22 +434,34 @@ class FullO3CPU : public BaseO3CPU
void setArchFloatRegInt(int reg_idx, uint64_t val, unsigned tid);
/** Reads the commit PC of a specific thread. */
uint64_t readPC(unsigned tid);
Addr readPC(unsigned tid);
/** Sets the commit PC of a specific thread. */
void setPC(Addr new_PC, unsigned tid);
/** Reads the commit micro PC of a specific thread. */
Addr readMicroPC(unsigned tid);
/** Sets the commmit micro PC of a specific thread. */
void setMicroPC(Addr new_microPC, unsigned tid);
/** Reads the next PC of a specific thread. */
uint64_t readNextPC(unsigned tid);
Addr readNextPC(unsigned tid);
/** Sets the next PC of a specific thread. */
void setNextPC(uint64_t val, unsigned tid);
void setNextPC(Addr val, unsigned tid);
/** Reads the next NPC of a specific thread. */
uint64_t readNextNPC(unsigned tid);
Addr readNextNPC(unsigned tid);
/** Sets the next NPC of a specific thread. */
void setNextNPC(uint64_t val, unsigned tid);
void setNextNPC(Addr val, unsigned tid);
/** Reads the commit next micro PC of a specific thread. */
Addr readNextMicroPC(unsigned tid);
/** Sets the commit next micro PC of a specific thread. */
void setNextMicroPC(Addr val, unsigned tid);
/** Function to add instruction onto the head of the list of the
* instructions. Used when new instructions are fetched.
@ -469,8 +481,7 @@ class FullO3CPU : public BaseO3CPU
/** Remove all instructions that are not currently in the ROB.
* There's also an option to not squash delay slot instructions.*/
void removeInstsNotInROB(unsigned tid, bool squash_delay_slot,
const InstSeqNum &delay_slot_seq_num);
void removeInstsNotInROB(unsigned tid);
/** Remove all instructions younger than the given sequence number. */
void removeInstsUntil(const InstSeqNum &seq_num,unsigned tid);

View file

@ -49,8 +49,6 @@ DefaultDecode<Impl>::DefaultDecode(O3CPU *_cpu, Params *params)
stalls[i].rename = false;
stalls[i].iew = false;
stalls[i].commit = false;
squashAfterDelaySlot[i] = false;
}
// @todo: Make into a parameter
@ -275,20 +273,16 @@ DefaultDecode<Impl>::squash(DynInstPtr &inst, unsigned tid)
///explicitly for ISAs with delay slots.
toFetch->decodeInfo[tid].nextNPC =
inst->branchTarget() + sizeof(TheISA::MachInst);
toFetch->decodeInfo[tid].nextMicroPC = inst->readMicroPC();
#if ISA_HAS_DELAY_SLOT
toFetch->decodeInfo[tid].branchTaken = inst->readNextNPC() !=
(inst->readNextPC() + sizeof(TheISA::MachInst));
toFetch->decodeInfo[tid].bdelayDoneSeqNum = bdelayDoneSeqNum[tid];
squashAfterDelaySlot[tid] = false;
InstSeqNum squash_seq_num = bdelayDoneSeqNum[tid];
#else
toFetch->decodeInfo[tid].branchTaken =
inst->readNextPC() != (inst->readPC() + sizeof(TheISA::MachInst));
#endif
InstSeqNum squash_seq_num = inst->seqNum;
#endif
// Might have to tell fetch to unblock.
if (decodeStatus[tid] == Blocked ||
@ -309,30 +303,10 @@ DefaultDecode<Impl>::squash(DynInstPtr &inst, unsigned tid)
// Clear the instruction list and skid buffer in case they have any
// insts in them.
while (!insts[tid].empty()) {
#if ISA_HAS_DELAY_SLOT
if (insts[tid].front()->seqNum <= squash_seq_num) {
DPRINTF(Decode, "[tid:%i]: Cannot remove incoming decode "
"instructions before delay slot [sn:%i]. %i insts"
"left in decode.\n", tid, squash_seq_num,
insts[tid].size());
break;
}
#endif
insts[tid].pop();
}
while (!skidBuffer[tid].empty()) {
#if ISA_HAS_DELAY_SLOT
if (skidBuffer[tid].front()->seqNum <= squash_seq_num) {
DPRINTF(Decode, "[tid:%i]: Cannot remove skidBuffer "
"instructions before delay slot [sn:%i]. %i insts"
"left in decode.\n", tid, squash_seq_num,
insts[tid].size());
break;
}
#endif
skidBuffer[tid].pop();
}
@ -760,48 +734,13 @@ DefaultDecode<Impl>::decodeInsts(unsigned tid)
// Might want to set some sort of boolean and just do
// a check at the end
#if !ISA_HAS_DELAY_SLOT
squash(inst, inst->threadNumber);
Addr target = inst->branchTarget();
inst->setPredTarg(target, target + sizeof(TheISA::MachInst));
//The micro pc after an instruction level branch should be 0
inst->setPredTarg(target, target + sizeof(TheISA::MachInst), 0);
break;
#else
// If mispredicted as taken, then ignore delay slot
// instruction... else keep delay slot and squash
// after it is sent to rename
if (inst->readPredTaken() && inst->isCondDelaySlot()) {
DPRINTF(Decode, "[tid:%i]: Conditional delay slot inst."
"[sn:%i] PC %#x mispredicted as taken.\n", tid,
inst->seqNum, inst->PC);
bdelayDoneSeqNum[tid] = inst->seqNum;
squash(inst, inst->threadNumber);
Addr target = inst->branchTarget();
inst->setPredTarg(target,
target + sizeof(TheISA::MachInst));
break;
} else {
DPRINTF(Decode, "[tid:%i]: Misprediction detected at "
"[sn:%i] PC %#x, will squash after delay slot "
"inst. is sent to Rename\n",
tid, inst->seqNum, inst->PC);
bdelayDoneSeqNum[tid] = inst->seqNum + 1;
squashAfterDelaySlot[tid] = true;
squashInst[tid] = inst;
continue;
}
#endif
}
}
if (squashAfterDelaySlot[tid]) {
assert(!inst->isSquashed());
squash(squashInst[tid], squashInst[tid]->threadNumber);
Addr target = squashInst[tid]->branchTarget();
squashInst[tid]->setPredTarg(target,
target + sizeof(TheISA::MachInst));
assert(!inst->isSquashed());
break;
}
}
// If we didn't process all instructions, then we will need to block

View file

@ -227,7 +227,7 @@ class DefaultFetch
* @param next_NPC Used for ISAs which use delay slots.
* @return Whether or not a branch was predicted as taken.
*/
bool lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC, Addr &next_NPC);
bool lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC, Addr &next_NPC, Addr &next_MicroPC);
/**
* Fetches the cache line that contains fetch_PC. Returns any
@ -242,12 +242,14 @@ class DefaultFetch
bool fetchCacheLine(Addr fetch_PC, Fault &ret_fault, unsigned tid);
/** Squashes a specific thread and resets the PC. */
inline void doSquash(const Addr &new_PC, const Addr &new_NPC, unsigned tid);
inline void doSquash(const Addr &new_PC, const Addr &new_NPC,
const Addr &new_MicroPC, unsigned tid);
/** Squashes a specific thread and resets the PC. Also tells the CPU to
* remove any instructions between fetch and decode that should be sqaushed.
*/
void squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
const Addr &new_MicroPC,
const InstSeqNum &seq_num, unsigned tid);
/** Checks if a thread is stalled. */
@ -263,8 +265,8 @@ class DefaultFetch
* squash should be the commit stage.
*/
void squash(const Addr &new_PC, const Addr &new_NPC,
const InstSeqNum &seq_num,
bool squash_delay_slot, unsigned tid);
const Addr &new_MicroPC,
const InstSeqNum &seq_num, unsigned tid);
/** Ticks the fetch stage, processing all inputs signals and fetching
* as many instructions as possible.
@ -347,16 +349,12 @@ class DefaultFetch
/** Per-thread fetch PC. */
Addr PC[Impl::MaxThreads];
/** Per-thread fetch micro PC. */
Addr microPC[Impl::MaxThreads];
/** Per-thread next PC. */
Addr nextPC[Impl::MaxThreads];
/** Per-thread next Next PC.
* This is not a real register but is used for
* architectures that use a branch-delay slot.
* (such as MIPS or Sparc)
*/
Addr nextNPC[Impl::MaxThreads];
/** Memory request used to access cache. */
RequestPtr memReq[Impl::MaxThreads];

View file

@ -313,7 +313,7 @@ DefaultFetch<Impl>::initStage()
for (int tid = 0; tid < numThreads; tid++) {
PC[tid] = cpu->readPC(tid);
nextPC[tid] = cpu->readNextPC(tid);
nextNPC[tid] = cpu->readNextNPC(tid);
microPC[tid] = cpu->readMicroPC(tid);
}
for (int tid=0; tid < numThreads; tid++) {
@ -440,11 +440,7 @@ DefaultFetch<Impl>::takeOverFrom()
stalls[i].commit = 0;
PC[i] = cpu->readPC(i);
nextPC[i] = cpu->readNextPC(i);
#if ISA_HAS_DELAY_SLOT
nextNPC[i] = cpu->readNextNPC(i);
#else
nextNPC[i] = nextPC[i] + sizeof(TheISA::MachInst);
#endif
microPC[i] = cpu->readMicroPC(i);
fetchStatus[i] = Running;
}
numInst = 0;
@ -494,7 +490,7 @@ DefaultFetch<Impl>::switchToInactive()
template <class Impl>
bool
DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
Addr &next_NPC)
Addr &next_NPC, Addr &next_MicroPC)
{
// Do branch prediction check here.
// A bit of a misnomer...next_PC is actually the current PC until
@ -502,13 +498,22 @@ DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
bool predict_taken;
if (!inst->isControl()) {
next_PC = next_NPC;
next_NPC = next_NPC + instSize;
inst->setPredTarg(next_PC, next_NPC);
if (inst->isMicroop() && !inst->isLastMicroop()) {
next_MicroPC++;
} else {
next_PC = next_NPC;
next_NPC = next_NPC + instSize;
next_MicroPC = 0;
}
inst->setPredTarg(next_PC, next_NPC, next_MicroPC);
inst->setPredTaken(false);
return false;
}
//Assume for now that all control flow is to a different macroop which
//would reset the micro pc to 0.
next_MicroPC = 0;
int tid = inst->threadNumber;
Addr pred_PC = next_PC;
predict_taken = branchPred.predict(inst, pred_PC, tid);
@ -535,7 +540,7 @@ DefaultFetch<Impl>::lookupAndUpdateNextPC(DynInstPtr &inst, Addr &next_PC,
#endif
/* DPRINTF(Fetch, "[tid:%i]: Branch predicted to go to %#x and then %#x.\n",
tid, next_PC, next_NPC);*/
inst->setPredTarg(next_PC, next_NPC);
inst->setPredTarg(next_PC, next_NPC, next_MicroPC);
inst->setPredTaken(predict_taken);
++fetchedBranches;
@ -659,14 +664,14 @@ DefaultFetch<Impl>::fetchCacheLine(Addr fetch_PC, Fault &ret_fault, unsigned tid
template <class Impl>
inline void
DefaultFetch<Impl>::doSquash(const Addr &new_PC,
const Addr &new_NPC, unsigned tid)
const Addr &new_NPC, const Addr &new_microPC, unsigned tid)
{
DPRINTF(Fetch, "[tid:%i]: Squashing, setting PC to: %#x, NPC to: %#x.\n",
tid, new_PC, new_NPC);
PC[tid] = new_PC;
nextPC[tid] = new_NPC;
nextNPC[tid] = new_NPC + instSize;
microPC[tid] = new_microPC;
// Clear the icache miss if it's outstanding.
if (fetchStatus[tid] == IcacheWaitResponse) {
@ -694,12 +699,12 @@ DefaultFetch<Impl>::doSquash(const Addr &new_PC,
template<class Impl>
void
DefaultFetch<Impl>::squashFromDecode(const Addr &new_PC, const Addr &new_NPC,
const InstSeqNum &seq_num,
unsigned tid)
const Addr &new_MicroPC,
const InstSeqNum &seq_num, unsigned tid)
{
DPRINTF(Fetch, "[tid:%i]: Squashing from decode.\n",tid);
doSquash(new_PC, new_NPC, tid);
doSquash(new_PC, new_NPC, new_MicroPC, tid);
// Tell the CPU to remove any instructions that are in flight between
// fetch and decode.
@ -775,20 +780,15 @@ DefaultFetch<Impl>::updateFetchStatus()
template <class Impl>
void
DefaultFetch<Impl>::squash(const Addr &new_PC, const Addr &new_NPC,
const InstSeqNum &seq_num,
bool squash_delay_slot, unsigned tid)
const Addr &new_MicroPC,
const InstSeqNum &seq_num, unsigned tid)
{
DPRINTF(Fetch, "[tid:%u]: Squash from commit.\n",tid);
doSquash(new_PC, new_NPC, tid);
doSquash(new_PC, new_NPC, new_MicroPC, tid);
#if ISA_HAS_DELAY_SLOT
// Tell the CPU to remove any instructions that are not in the ROB.
cpu->removeInstsNotInROB(tid, squash_delay_slot, seq_num);
#else
// Tell the CPU to remove any instructions that are not in the ROB.
cpu->removeInstsNotInROB(tid, true, 0);
#endif
cpu->removeInstsNotInROB(tid);
}
template <class Impl>
@ -897,17 +897,11 @@ DefaultFetch<Impl>::checkSignalsAndUpdate(unsigned tid)
DPRINTF(Fetch, "[tid:%u]: Squashing instructions due to squash "
"from commit.\n",tid);
#if ISA_HAS_DELAY_SLOT
InstSeqNum doneSeqNum = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
#else
InstSeqNum doneSeqNum = fromCommit->commitInfo[tid].doneSeqNum;
#endif
// In any case, squash.
squash(fromCommit->commitInfo[tid].nextPC,
fromCommit->commitInfo[tid].nextNPC,
doneSeqNum,
fromCommit->commitInfo[tid].squashDelaySlot,
fromCommit->commitInfo[tid].nextMicroPC,
fromCommit->commitInfo[tid].doneSeqNum,
tid);
// Also check if there's a mispredict that happened.
@ -956,18 +950,14 @@ DefaultFetch<Impl>::checkSignalsAndUpdate(unsigned tid)
if (fetchStatus[tid] != Squashing) {
#if ISA_HAS_DELAY_SLOT
InstSeqNum doneSeqNum = fromDecode->decodeInfo[tid].bdelayDoneSeqNum;
#else
InstSeqNum doneSeqNum = fromDecode->decodeInfo[tid].doneSeqNum;
#endif
DPRINTF(Fetch, "Squashing from decode with PC = %#x, NPC = %#x\n",
fromDecode->decodeInfo[tid].nextPC,
fromDecode->decodeInfo[tid].nextNPC);
// Squash unless we're already squashing
squashFromDecode(fromDecode->decodeInfo[tid].nextPC,
fromDecode->decodeInfo[tid].nextNPC,
doneSeqNum,
fromDecode->decodeInfo[tid].nextMicroPC,
fromDecode->decodeInfo[tid].doneSeqNum,
tid);
return true;
@ -1021,9 +1011,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
DPRINTF(Fetch, "Attempting to fetch from [tid:%i]\n", tid);
// The current PC.
Addr &fetch_PC = PC[tid];
Addr &fetch_NPC = nextPC[tid];
Addr fetch_PC = PC[tid];
Addr fetch_NPC = nextPC[tid];
Addr fetch_MicroPC = microPC[tid];
// Fault code for memory access.
Fault fault = NoFault;
@ -1082,6 +1072,7 @@ DefaultFetch<Impl>::fetch(bool &status_change)
Addr next_PC = fetch_PC;
Addr next_NPC = fetch_NPC;
Addr next_MicroPC = fetch_MicroPC;
InstSeqNum inst_seq;
MachInst inst;
@ -1089,6 +1080,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
// @todo: Fix this hack.
unsigned offset = (fetch_PC & cacheBlkMask) & ~3;
StaticInstPtr staticInst = NULL;
StaticInstPtr macroop = NULL;
if (fault == NoFault) {
// If the read of the first instruction was successful, then grab the
// instructions from the rest of the cache line and put them into the
@ -1101,11 +1095,9 @@ DefaultFetch<Impl>::fetch(bool &status_change)
// ended this fetch block.
bool predicted_branch = false;
for (;
offset < cacheBlkSize &&
numInst < fetchWidth &&
!predicted_branch;
++numInst) {
while (offset < cacheBlkSize &&
numInst < fetchWidth &&
!predicted_branch) {
// If we're branching after this instruction, quite fetching
// from the same block then.
@ -1116,95 +1108,107 @@ DefaultFetch<Impl>::fetch(bool &status_change)
fetch_PC, fetch_NPC);
}
// Get a sequence number.
inst_seq = cpu->getAndIncrementInstSeq();
// Make sure this is a valid index.
assert(offset <= cacheBlkSize - instSize);
// Get the instruction from the array of the cache line.
inst = TheISA::gtoh(*reinterpret_cast<TheISA::MachInst *>
(&cacheData[tid][offset]));
if (!macroop) {
// Get the instruction from the array of the cache line.
inst = TheISA::gtoh(*reinterpret_cast<TheISA::MachInst *>
(&cacheData[tid][offset]));
predecoder.setTC(cpu->thread[tid]->getTC());
predecoder.moreBytes(fetch_PC, fetch_PC, inst);
predecoder.setTC(cpu->thread[tid]->getTC());
predecoder.moreBytes(fetch_PC, fetch_PC, inst);
ext_inst = predecoder.getExtMachInst();
ext_inst = predecoder.getExtMachInst();
staticInst = StaticInstPtr(ext_inst, fetch_PC);
if (staticInst->isMacroop())
macroop = staticInst;
}
do {
if (macroop) {
staticInst = macroop->fetchMicroop(fetch_MicroPC);
if (staticInst->isLastMicroop())
macroop = NULL;
}
// Create a new DynInst from the instruction fetched.
DynInstPtr instruction = new DynInst(ext_inst,
fetch_PC, fetch_NPC,
next_PC, next_NPC,
inst_seq, cpu);
instruction->setTid(tid);
// Get a sequence number.
inst_seq = cpu->getAndIncrementInstSeq();
instruction->setASID(tid);
// Create a new DynInst from the instruction fetched.
DynInstPtr instruction = new DynInst(staticInst,
fetch_PC, fetch_NPC, fetch_MicroPC,
next_PC, next_NPC, next_MicroPC,
inst_seq, cpu);
instruction->setTid(tid);
instruction->setThreadState(cpu->thread[tid]);
instruction->setASID(tid);
DPRINTF(Fetch, "[tid:%i]: Instruction PC %#x created "
"[sn:%lli]\n",
tid, instruction->readPC(), inst_seq);
instruction->setThreadState(cpu->thread[tid]);
//DPRINTF(Fetch, "[tid:%i]: MachInst is %#x\n", tid, ext_inst);
DPRINTF(Fetch, "[tid:%i]: Instruction PC %#x created "
"[sn:%lli]\n",
tid, instruction->readPC(), inst_seq);
DPRINTF(Fetch, "[tid:%i]: Instruction is: %s\n",
tid, instruction->staticInst->disassemble(fetch_PC));
//DPRINTF(Fetch, "[tid:%i]: MachInst is %#x\n", tid, ext_inst);
DPRINTF(Fetch, "[tid:%i]: Instruction is: %s\n",
tid, instruction->staticInst->disassemble(fetch_PC));
#if TRACING_ON
instruction->traceData =
Trace::getInstRecord(curTick, cpu->tcBase(tid),
instruction->staticInst,
instruction->readPC());
instruction->traceData =
Trace::getInstRecord(curTick, cpu->tcBase(tid),
instruction->staticInst,
instruction->readPC());
#else
instruction->traceData = NULL;
instruction->traceData = NULL;
#endif
///FIXME This needs to be more robust in dealing with delay slots
#if !ISA_HAS_DELAY_SLOT
// predicted_branch |=
#endif
lookupAndUpdateNextPC(instruction, next_PC, next_NPC);
predicted_branch |= (next_PC != fetch_NPC);
///FIXME This needs to be more robust in dealing with delay slots
predicted_branch |=
lookupAndUpdateNextPC(instruction, next_PC, next_NPC, next_MicroPC);
// Add instruction to the CPU's list of instructions.
instruction->setInstListIt(cpu->addInst(instruction));
// Add instruction to the CPU's list of instructions.
instruction->setInstListIt(cpu->addInst(instruction));
// Write the instruction to the first slot in the queue
// that heads to decode.
toDecode->insts[numInst] = instruction;
// Write the instruction to the first slot in the queue
// that heads to decode.
toDecode->insts[numInst] = instruction;
toDecode->size++;
toDecode->size++;
// Increment stat of fetched instructions.
++fetchedInsts;
// Increment stat of fetched instructions.
++fetchedInsts;
// Move to the next instruction, unless we have a branch.
fetch_PC = next_PC;
fetch_NPC = next_NPC;
// Move to the next instruction, unless we have a branch.
fetch_PC = next_PC;
fetch_NPC = next_NPC;
fetch_MicroPC = next_MicroPC;
if (instruction->isQuiesce()) {
DPRINTF(Fetch, "Quiesce instruction encountered, halting fetch!",
curTick);
fetchStatus[tid] = QuiescePending;
++numInst;
status_change = true;
break;
}
if (instruction->isQuiesce()) {
DPRINTF(Fetch, "Quiesce instruction encountered, halting fetch!",
curTick);
fetchStatus[tid] = QuiescePending;
++numInst;
status_change = true;
break;
}
} while (staticInst->isMicroop() &&
!staticInst->isLastMicroop() &&
numInst < fetchWidth);
offset += instSize;
}
if (offset >= cacheBlkSize) {
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached the end of cache "
"block.\n", tid);
if (predicted_branch) {
DPRINTF(Fetch, "[tid:%i]: Done fetching, predicted branch "
"instruction encountered.\n", tid);
} else if (numInst >= fetchWidth) {
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached fetch bandwidth "
"for this cycle.\n", tid);
} else if (predicted_branch) {
DPRINTF(Fetch, "[tid:%i]: Done fetching, predicted branch "
"instruction encountered.\n", tid);
} else if (offset >= cacheBlkSize) {
DPRINTF(Fetch, "[tid:%i]: Done fetching, reached the end of cache "
"block.\n", tid);
}
}
@ -1217,12 +1221,8 @@ DefaultFetch<Impl>::fetch(bool &status_change)
if (fault == NoFault) {
PC[tid] = next_PC;
nextPC[tid] = next_NPC;
nextNPC[tid] = next_NPC + instSize;
#if ISA_HAS_DELAY_SLOT
DPRINTF(Fetch, "[tid:%i]: Setting PC to %08p.\n", tid, PC[tid]);
#else
microPC[tid] = next_MicroPC;
DPRINTF(Fetch, "[tid:%i]: Setting PC to %08p.\n", tid, next_PC);
#endif
} else {
// We shouldn't be in an icache miss and also have a fault (an ITB
// miss)
@ -1242,10 +1242,10 @@ DefaultFetch<Impl>::fetch(bool &status_change)
// Create a new DynInst from the dummy nop.
DynInstPtr instruction = new DynInst(ext_inst,
fetch_PC, fetch_NPC,
next_PC, next_NPC,
fetch_PC, fetch_NPC, fetch_MicroPC,
next_PC, next_NPC, next_MicroPC,
inst_seq, cpu);
instruction->setPredTarg(next_PC, next_NPC);
instruction->setPredTarg(next_PC, next_NPC, 1);
instruction->setTid(tid);
instruction->setASID(tid);

View file

@ -168,7 +168,9 @@ SimpleFreeList::addReg(PhysRegIndex freed_reg)
if (freed_reg != TheISA::ZeroReg)
freeIntRegs.push(freed_reg);
} else if (freed_reg < numPhysicalRegs) {
#if THE_ISA == ALPHA_ISA
if (freed_reg != (TheISA::ZeroReg + numPhysicalIntRegs))
#endif
freeFloatRegs.push(freed_reg);
}
}

View file

@ -402,9 +402,6 @@ class DefaultIEW
/** Records if there is a fetch redirect on this cycle for each thread. */
bool fetchRedirect[Impl::MaxThreads];
/** Keeps track of the last valid branch delay slot instss for threads */
InstSeqNum bdelayDoneSeqNum[Impl::MaxThreads];
/** Used to track if all instructions have been dispatched this cycle.
* If they have not, then blocking must have occurred, and the instructions
* would already be added to the skid buffer.

View file

@ -69,7 +69,6 @@ DefaultIEW<Impl>::DefaultIEW(O3CPU *_cpu, Params *params)
dispatchStatus[i] = Running;
stalls[i].commit = false;
fetchRedirect[i] = false;
bdelayDoneSeqNum[i] = 0;
}
wbMax = wbWidth * params->wbDepth;
@ -410,31 +409,14 @@ DefaultIEW<Impl>::squash(unsigned tid)
instQueue.squash(tid);
// Tell the LDSTQ to start squashing.
#if ISA_HAS_DELAY_SLOT
ldstQueue.squash(fromCommit->commitInfo[tid].bdelayDoneSeqNum, tid);
#else
ldstQueue.squash(fromCommit->commitInfo[tid].doneSeqNum, tid);
#endif
updatedQueues = true;
// Clear the skid buffer in case it has any data in it.
DPRINTF(IEW, "[tid:%i]: Removing skidbuffer instructions until [sn:%i].\n",
tid, fromCommit->commitInfo[tid].bdelayDoneSeqNum);
tid, fromCommit->commitInfo[tid].doneSeqNum);
while (!skidBuffer[tid].empty()) {
#if ISA_HAS_DELAY_SLOT
if (skidBuffer[tid].front()->seqNum <=
fromCommit->commitInfo[tid].bdelayDoneSeqNum) {
DPRINTF(IEW, "[tid:%i]: Cannot remove skidbuffer instructions "
"that occur before delay slot [sn:%i].\n",
fromCommit->commitInfo[tid].bdelayDoneSeqNum,
tid);
break;
} else {
DPRINTF(IEW, "[tid:%i]: Removing instruction [sn:%i] from "
"skidBuffer.\n", tid, skidBuffer[tid].front()->seqNum);
}
#endif
if (skidBuffer[tid].front()->isLoad() ||
skidBuffer[tid].front()->isStore() ) {
toRename->iewInfo[tid].dispatchedToLSQ++;
@ -445,8 +427,6 @@ DefaultIEW<Impl>::squash(unsigned tid)
skidBuffer[tid].pop();
}
bdelayDoneSeqNum[tid] = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
emptyRenameInsts(tid);
}
@ -462,38 +442,19 @@ DefaultIEW<Impl>::squashDueToBranch(DynInstPtr &inst, unsigned tid)
toCommit->mispredPC[tid] = inst->readPC();
toCommit->branchMispredict[tid] = true;
int instSize = sizeof(TheISA::MachInst);
#if ISA_HAS_DELAY_SLOT
bool branch_taken =
int instSize = sizeof(TheISA::MachInst);
toCommit->branchTaken[tid] =
!(inst->readNextPC() + instSize == inst->readNextNPC() &&
(inst->readNextPC() == inst->readPC() + instSize ||
inst->readNextPC() == inst->readPC() + 2 * instSize));
DPRINTF(Sparc, "Branch taken = %s [sn:%i]\n",
branch_taken ? "true": "false", inst->seqNum);
toCommit->branchTaken[tid] = branch_taken;
bool squashDelaySlot = true;
// (inst->readNextPC() != inst->readPC() + sizeof(TheISA::MachInst));
DPRINTF(Sparc, "Squash delay slot = %s [sn:%i]\n",
squashDelaySlot ? "true": "false", inst->seqNum);
toCommit->squashDelaySlot[tid] = squashDelaySlot;
//If we're squashing the delay slot, we need to pick back up at NextPC.
//Otherwise, NextPC isn't being squashed, so we should pick back up at
//NextNPC.
if (squashDelaySlot) {
toCommit->nextPC[tid] = inst->readNextPC();
toCommit->nextNPC[tid] = inst->readNextNPC();
} else {
toCommit->nextPC[tid] = inst->readNextNPC();
toCommit->nextNPC[tid] = inst->readNextNPC() + instSize;
}
#else
toCommit->branchTaken[tid] = inst->readNextPC() !=
(inst->readPC() + sizeof(TheISA::MachInst));
toCommit->nextPC[tid] = inst->readNextPC();
toCommit->nextNPC[tid] = inst->readNextPC() + instSize;
#endif
toCommit->nextPC[tid] = inst->readNextPC();
toCommit->nextNPC[tid] = inst->readNextNPC();
toCommit->nextMicroPC[tid] = inst->readNextMicroPC();
toCommit->includeSquashInst[tid] = false;
@ -510,11 +471,7 @@ DefaultIEW<Impl>::squashDueToMemOrder(DynInstPtr &inst, unsigned tid)
toCommit->squash[tid] = true;
toCommit->squashedSeqNum[tid] = inst->seqNum;
toCommit->nextPC[tid] = inst->readNextPC();
#if ISA_HAS_DELAY_SLOT
toCommit->nextNPC[tid] = inst->readNextNPC();
#else
toCommit->nextNPC[tid] = inst->readNextPC() + sizeof(TheISA::MachInst);
#endif
toCommit->branchMispredict[tid] = false;
toCommit->includeSquashInst[tid] = false;
@ -532,11 +489,7 @@ DefaultIEW<Impl>::squashDueToMemBlocked(DynInstPtr &inst, unsigned tid)
toCommit->squash[tid] = true;
toCommit->squashedSeqNum[tid] = inst->seqNum;
toCommit->nextPC[tid] = inst->readPC();
#if ISA_HAS_DELAY_SLOT
toCommit->nextNPC[tid] = inst->readNextPC();
#else
toCommit->nextNPC[tid] = inst->readPC() + sizeof(TheISA::MachInst);
#endif
toCommit->branchMispredict[tid] = false;
// Must include the broadcasted SN in the squash.
@ -880,10 +833,8 @@ DefaultIEW<Impl>::sortInsts()
{
int insts_from_rename = fromRename->size;
#ifdef DEBUG
#if !ISA_HAS_DELAY_SLOT
for (int i = 0; i < numThreads; i++)
assert(insts[i].empty());
#endif
#endif
for (int i = 0; i < insts_from_rename; ++i) {
insts[fromRename->insts[i]->threadNumber].push(fromRename->insts[i]);
@ -894,21 +845,9 @@ template <class Impl>
void
DefaultIEW<Impl>::emptyRenameInsts(unsigned tid)
{
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instructions until "
"[sn:%i].\n", tid, bdelayDoneSeqNum[tid]);
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instructions\n", tid);
while (!insts[tid].empty()) {
#if ISA_HAS_DELAY_SLOT
if (insts[tid].front()->seqNum <= bdelayDoneSeqNum[tid]) {
DPRINTF(IEW, "[tid:%i]: Done removing, cannot remove instruction"
" that occurs at or before delay slot [sn:%i].\n",
tid, bdelayDoneSeqNum[tid]);
break;
} else {
DPRINTF(IEW, "[tid:%i]: Removing incoming rename instruction "
"[sn:%i].\n", tid, insts[tid].front()->seqNum);
}
#endif
if (insts[tid].front()->isLoad() ||
insts[tid].front()->isStore() ) {

View file

@ -1005,11 +1005,7 @@ InstructionQueue<Impl>::squash(unsigned tid)
// Read instruction sequence number of last instruction out of the
// time buffer.
#if ISA_HAS_DELAY_SLOT
squashedSeqNum[tid] = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
#else
squashedSeqNum[tid] = fromCommit->commitInfo[tid].doneSeqNum;
#endif
// Call doSquash if there are insts in the IQ
if (count[tid] > 0) {

View file

@ -69,10 +69,16 @@ class MipsDynInst : public BaseDynInst<Impl>
};
public:
/** BaseDynInst constructor given a binary instruction. */
MipsDynInst(StaticInstPtr staticInst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a binary instruction. */
MipsDynInst(ExtMachInst inst,
Addr PC, Addr NPC,
Addr Pred_PC, Addr Pred_NPC,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a static inst pointer. */

View file

@ -31,11 +31,23 @@
#include "cpu/o3/mips/dyn_inst.hh"
template <class Impl>
MipsDynInst<Impl>::MipsDynInst(ExtMachInst inst,
Addr PC, Addr NPC,
Addr Pred_PC, Addr Pred_NPC,
MipsDynInst<Impl>::MipsDynInst(StaticInstPtr staticInst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}
template <class Impl>
MipsDynInst<Impl>::MipsDynInst(ExtMachInst inst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}

View file

@ -179,7 +179,9 @@ class PhysRegFile
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
int(reg_idx), (uint64_t)val);
#if THE_ISA == ALPHA_ISA
if (reg_idx != TheISA::ZeroReg)
#endif
floatRegFile[reg_idx].d = val;
}
@ -194,7 +196,9 @@ class PhysRegFile
DPRINTF(IEW, "RegFile: Setting float register %i to %#x\n",
int(reg_idx), (uint64_t)val);
#if THE_ISA == ALPHA_ISA
if (reg_idx != TheISA::ZeroReg)
#endif
floatRegFile[reg_idx].d = val;
}

View file

@ -356,47 +356,12 @@ DefaultRename<Impl>::squash(const InstSeqNum &squash_seq_num, unsigned tid)
}
// Clear the instruction list and skid buffer in case they have any
// insts in them. Since we support multiple ISAs, we cant just:
// "insts[tid].clear();" or "skidBuffer[tid].clear()" since there is
// a possible delay slot inst for different architectures
// insts[tid].clear();
#if ISA_HAS_DELAY_SLOT
DPRINTF(Rename, "[tid:%i] Squashing incoming decode instructions until "
"[sn:%i].\n",tid, squash_seq_num);
ListIt ilist_it = insts[tid].begin();
while (ilist_it != insts[tid].end()) {
if ((*ilist_it)->seqNum > squash_seq_num) {
(*ilist_it)->setSquashed();
DPRINTF(Rename, "Squashing incoming decode instruction, "
"[tid:%i] [sn:%i] PC %08p.\n", tid, (*ilist_it)->seqNum, (*ilist_it)->PC);
}
ilist_it++;
}
#else
// insts in them.
insts[tid].clear();
#endif
// Clear the skid buffer in case it has any data in it.
// See comments above.
// skidBuffer[tid].clear();
#if ISA_HAS_DELAY_SLOT
DPRINTF(Rename, "[tid:%i] Squashing incoming skidbuffer instructions "
"until [sn:%i].\n", tid, squash_seq_num);
ListIt slist_it = skidBuffer[tid].begin();
while (slist_it != skidBuffer[tid].end()) {
if ((*slist_it)->seqNum > squash_seq_num) {
(*slist_it)->setSquashed();
DPRINTF(Rename, "Squashing skidbuffer instruction, [tid:%i] [sn:%i]"
"PC %08p.\n", tid, (*slist_it)->seqNum, (*slist_it)->PC);
}
slist_it++;
}
resumeUnblocking = (skidBuffer[tid].size() != 0);
DPRINTF(Rename, "Resume unblocking set to %s\n",
resumeUnblocking ? "true" : "false");
#else
skidBuffer[tid].clear();
#endif
doSquash(squash_seq_num, tid);
}
@ -776,10 +741,8 @@ DefaultRename<Impl>::sortInsts()
{
int insts_from_decode = fromDecode->size;
#ifdef DEBUG
#if !ISA_HAS_DELAY_SLOT
for (int i=0; i < numThreads; i++)
assert(insts[i].empty());
#endif
#endif
for (int i = 0; i < insts_from_decode; ++i) {
DynInstPtr inst = fromDecode->insts[i];
@ -1000,6 +963,7 @@ DefaultRename<Impl>::renameSrcRegs(DynInstPtr &inst,unsigned tid)
// Floating point and Miscellaneous registers need their indexes
// adjusted to account for the expanded number of flattened int regs.
flat_src_reg = src_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
DPRINTF(Rename, "Adjusting reg index from %d to %d.\n", src_reg, flat_src_reg);
}
inst->flattenSrcReg(src_idx, flat_src_reg);
@ -1016,9 +980,11 @@ DefaultRename<Impl>::renameSrcRegs(DynInstPtr &inst,unsigned tid)
// See if the register is ready or not.
if (scoreboard->getReg(renamed_reg) == true) {
DPRINTF(Rename, "[tid:%u]: Register is ready.\n", tid);
DPRINTF(Rename, "[tid:%u]: Register %d is ready.\n", tid, renamed_reg);
inst->markSrcRegReady(src_idx);
} else {
DPRINTF(Rename, "[tid:%u]: Register %d is not ready.\n", tid, renamed_reg);
}
++renameRenameLookups;
@ -1045,6 +1011,7 @@ DefaultRename<Impl>::renameDestRegs(DynInstPtr &inst,unsigned tid)
// Floating point and Miscellaneous registers need their indexes
// adjusted to account for the expanded number of flattened int regs.
flat_dest_reg = dest_reg - TheISA::FP_Base_DepTag + TheISA::NumIntRegs;
DPRINTF(Rename, "Adjusting reg index from %d to %d.\n", dest_reg, flat_dest_reg);
}
inst->flattenDestReg(dest_idx, flat_dest_reg);
@ -1248,13 +1215,7 @@ DefaultRename<Impl>::checkSignalsAndUpdate(unsigned tid)
DPRINTF(Rename, "[tid:%u]: Squashing instructions due to squash from "
"commit.\n", tid);
#if ISA_HAS_DELAY_SLOT
InstSeqNum squashed_seq_num = fromCommit->commitInfo[tid].bdelayDoneSeqNum;
#else
InstSeqNum squashed_seq_num = fromCommit->commitInfo[tid].doneSeqNum;
#endif
squash(squashed_seq_num, tid);
squash(fromCommit->commitInfo[tid].doneSeqNum, tid);
return true;
}

View file

@ -165,17 +165,21 @@ SimpleRenameMap::rename(RegIndex arch_reg)
// If it's not referencing the zero register, then rename the
// register.
#if THE_ISA == ALPHA_ISA
if (arch_reg != floatZeroReg) {
#endif
renamed_reg = freeList->getFloatReg();
floatRenameMap[arch_reg].physical_reg = renamed_reg;
assert(renamed_reg < numPhysicalRegs &&
renamed_reg >= numPhysicalIntRegs);
#if THE_ISA == ALPHA_ISA
} else {
// Otherwise return the zero register so nothing bad happens.
renamed_reg = floatZeroReg;
}
#endif
} else {
// Subtract off the base offset for miscellaneous registers.
arch_reg = arch_reg - numLogicalRegs;

View file

@ -29,6 +29,7 @@
* Kevin Lim
*/
#include "arch/isa_specific.hh"
#include "cpu/o3/scoreboard.hh"
Scoreboard::Scoreboard(unsigned activeThreads,
@ -79,11 +80,18 @@ Scoreboard::name() const
bool
Scoreboard::getReg(PhysRegIndex phys_reg)
{
#if THE_ISA == ALPHA_ISA
// Always ready if int or fp zero reg.
if (phys_reg == zeroRegIdx ||
phys_reg == (zeroRegIdx + numPhysicalIntRegs)) {
return 1;
}
#else
// Always ready if int zero reg.
if (phys_reg == zeroRegIdx) {
return 1;
}
#endif
return regScoreBoard[phys_reg];
}
@ -99,11 +107,18 @@ Scoreboard::setReg(PhysRegIndex phys_reg)
void
Scoreboard::unsetReg(PhysRegIndex ready_reg)
{
#if THE_ISA == ALPHA_ISA
if (ready_reg == zeroRegIdx ||
ready_reg == (zeroRegIdx + numPhysicalIntRegs)) {
// Don't do anything if int or fp zero reg.
return;
}
#else
if (ready_reg == zeroRegIdx) {
// Don't do anything if int zero reg.
return;
}
#endif
regScoreBoard[ready_reg] = 0;
}

View file

@ -272,7 +272,10 @@ SparcO3CPU<Impl>::getSyscallArg(int i, int tid)
{
TheISA::IntReg idx = TheISA::flattenIntIndex(this->tcBase(tid),
SparcISA::ArgumentReg0 + i);
return this->readArchIntReg(idx, tid);
TheISA::IntReg val = this->readArchIntReg(idx, tid);
if (bits(this->readMiscRegNoEffect(SparcISA::MISCREG_PSTATE, tid), 3, 3))
val = bits(val, 31, 0);
return val;
}
template <class Impl>

View file

@ -56,8 +56,14 @@ class SparcDynInst : public BaseDynInst<Impl>
public:
/** BaseDynInst constructor given a binary instruction. */
SparcDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC,
Addr Pred_PC, Addr Pred_NPC, InstSeqNum seq_num, O3CPU *cpu);
SparcDynInst(StaticInstPtr staticInst, Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a binary instruction. */
SparcDynInst(TheISA::ExtMachInst inst, Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu);
/** BaseDynInst constructor given a static inst pointer. */
SparcDynInst(StaticInstPtr &_staticInst);

View file

@ -31,10 +31,23 @@
#include "cpu/o3/sparc/dyn_inst.hh"
template <class Impl>
SparcDynInst<Impl>::SparcDynInst(TheISA::ExtMachInst inst,
Addr PC, Addr NPC, Addr Pred_PC, Addr Pred_NPC,
SparcDynInst<Impl>::SparcDynInst(StaticInstPtr staticInst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, Pred_PC, Pred_NPC, seq_num, cpu)
: BaseDynInst<Impl>(staticInst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}
template <class Impl>
SparcDynInst<Impl>::SparcDynInst(TheISA::ExtMachInst inst,
Addr PC, Addr NPC, Addr microPC,
Addr Pred_PC, Addr Pred_NPC, Addr Pred_MicroPC,
InstSeqNum seq_num, O3CPU *cpu)
: BaseDynInst<Impl>(inst, PC, NPC, microPC,
Pred_PC, Pred_NPC, Pred_MicroPC, seq_num, cpu)
{
initVars();
}

View file

@ -0,0 +1,391 @@
[root]
type=Root
children=system
dummy=0
[system]
type=System
children=cpu membus physmem
mem_mode=atomic
physmem=system.physmem
[system.cpu]
type=DerivO3CPU
children=dcache fuPool icache l2cache toL2Bus workload
BTBEntries=4096
BTBTagSize=16
LFSTSize=1024
LQEntries=32
RASSize=16
SQEntries=32
SSITSize=1024
activity=0
backComSize=5
cachePorts=200
choiceCtrBits=2
choicePredictorSize=8192
clock=500
commitToDecodeDelay=1
commitToFetchDelay=1
commitToIEWDelay=1
commitToRenameDelay=1
commitWidth=8
cpu_id=0
decodeToFetchDelay=1
decodeToRenameDelay=1
decodeWidth=8
defer_registration=false
dispatchWidth=8
fetchToDecodeDelay=1
fetchTrapLatency=1
fetchWidth=8
forwardComSize=5
fuPool=system.cpu.fuPool
function_trace=false
function_trace_start=0
globalCtrBits=2
globalHistoryBits=13
globalPredictorSize=8192
iewToCommitDelay=1
iewToDecodeDelay=1
iewToFetchDelay=1
iewToRenameDelay=1
instShiftAmt=2
issueToExecuteDelay=1
issueWidth=8
localCtrBits=2
localHistoryBits=11
localHistoryTableSize=2048
localPredictorSize=2048
max_insts_all_threads=0
max_insts_any_thread=0
max_loads_all_threads=0
max_loads_any_thread=0
numIQEntries=64
numPhysFloatRegs=256
numPhysIntRegs=256
numROBEntries=192
numRobs=1
numThreads=1
phase=0
predType=tournament
progress_interval=0
renameToDecodeDelay=1
renameToFetchDelay=1
renameToIEWDelay=2
renameToROBDelay=1
renameWidth=8
smtCommitPolicy=RoundRobin
smtFetchPolicy=SingleThread
smtIQPolicy=Partitioned
smtIQThreshold=100
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtNumFetchingThreads=1
smtROBPolicy=Partitioned
smtROBThreshold=100
squashWidth=8
system=system
trapLatency=13
wbDepth=1
wbWidth=8
workload=system.cpu.workload
dcache_port=system.cpu.dcache.cpu_side
icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
compression_latency=0
hash_delay=1
latency=1000
lifo=false
max_miss_count=0
mshrs=10
prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
prefetch_serial_squash=false
prefetch_use_cpu_id=true
prefetcher_size=100
prioritizeRequests=false
protocol=Null
repl=Null
size=262144
split=false
split_size=0
store_compressed=false
subblock_size=0
tgts_per_mshr=20
trace_addr=0
two_queue=false
write_buffers=8
cpu_side=system.cpu.dcache_port
mem_side=system.cpu.toL2Bus.port[1]
[system.cpu.fuPool]
type=FUPool
children=FUList0 FUList1 FUList2 FUList3 FUList4 FUList5 FUList6 FUList7
FUList=system.cpu.fuPool.FUList0 system.cpu.fuPool.FUList1 system.cpu.fuPool.FUList2 system.cpu.fuPool.FUList3 system.cpu.fuPool.FUList4 system.cpu.fuPool.FUList5 system.cpu.fuPool.FUList6 system.cpu.fuPool.FUList7
[system.cpu.fuPool.FUList0]
type=FUDesc
children=opList0
count=6
opList=system.cpu.fuPool.FUList0.opList0
[system.cpu.fuPool.FUList0.opList0]
type=OpDesc
issueLat=1
opClass=IntAlu
opLat=1
[system.cpu.fuPool.FUList1]
type=FUDesc
children=opList0 opList1
count=2
opList=system.cpu.fuPool.FUList1.opList0 system.cpu.fuPool.FUList1.opList1
[system.cpu.fuPool.FUList1.opList0]
type=OpDesc
issueLat=1
opClass=IntMult
opLat=3
[system.cpu.fuPool.FUList1.opList1]
type=OpDesc
issueLat=19
opClass=IntDiv
opLat=20
[system.cpu.fuPool.FUList2]
type=FUDesc
children=opList0 opList1 opList2
count=4
opList=system.cpu.fuPool.FUList2.opList0 system.cpu.fuPool.FUList2.opList1 system.cpu.fuPool.FUList2.opList2
[system.cpu.fuPool.FUList2.opList0]
type=OpDesc
issueLat=1
opClass=FloatAdd
opLat=2
[system.cpu.fuPool.FUList2.opList1]
type=OpDesc
issueLat=1
opClass=FloatCmp
opLat=2
[system.cpu.fuPool.FUList2.opList2]
type=OpDesc
issueLat=1
opClass=FloatCvt
opLat=2
[system.cpu.fuPool.FUList3]
type=FUDesc
children=opList0 opList1 opList2
count=2
opList=system.cpu.fuPool.FUList3.opList0 system.cpu.fuPool.FUList3.opList1 system.cpu.fuPool.FUList3.opList2
[system.cpu.fuPool.FUList3.opList0]
type=OpDesc
issueLat=1
opClass=FloatMult
opLat=4
[system.cpu.fuPool.FUList3.opList1]
type=OpDesc
issueLat=12
opClass=FloatDiv
opLat=12
[system.cpu.fuPool.FUList3.opList2]
type=OpDesc
issueLat=24
opClass=FloatSqrt
opLat=24
[system.cpu.fuPool.FUList4]
type=FUDesc
children=opList0
count=0
opList=system.cpu.fuPool.FUList4.opList0
[system.cpu.fuPool.FUList4.opList0]
type=OpDesc
issueLat=1
opClass=MemRead
opLat=1
[system.cpu.fuPool.FUList5]
type=FUDesc
children=opList0
count=0
opList=system.cpu.fuPool.FUList5.opList0
[system.cpu.fuPool.FUList5.opList0]
type=OpDesc
issueLat=1
opClass=MemWrite
opLat=1
[system.cpu.fuPool.FUList6]
type=FUDesc
children=opList0 opList1
count=4
opList=system.cpu.fuPool.FUList6.opList0 system.cpu.fuPool.FUList6.opList1
[system.cpu.fuPool.FUList6.opList0]
type=OpDesc
issueLat=1
opClass=MemRead
opLat=1
[system.cpu.fuPool.FUList6.opList1]
type=OpDesc
issueLat=1
opClass=MemWrite
opLat=1
[system.cpu.fuPool.FUList7]
type=FUDesc
children=opList0
count=1
opList=system.cpu.fuPool.FUList7.opList0
[system.cpu.fuPool.FUList7.opList0]
type=OpDesc
issueLat=3
opClass=IprAccess
opLat=3
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
compression_latency=0
hash_delay=1
latency=1000
lifo=false
max_miss_count=0
mshrs=10
prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
prefetch_serial_squash=false
prefetch_use_cpu_id=true
prefetcher_size=100
prioritizeRequests=false
protocol=Null
repl=Null
size=131072
split=false
split_size=0
store_compressed=false
subblock_size=0
tgts_per_mshr=20
trace_addr=0
two_queue=false
write_buffers=8
cpu_side=system.cpu.icache_port
mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
compression_latency=0
hash_delay=1
latency=1000
lifo=false
max_miss_count=0
mshrs=10
prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
prefetch_serial_squash=false
prefetch_use_cpu_id=true
prefetcher_size=100
prioritizeRequests=false
protocol=Null
repl=Null
size=2097152
split=false
split_size=0
store_compressed=false
subblock_size=0
tgts_per_mshr=5
trace_addr=0
two_queue=false
write_buffers=8
cpu_side=system.cpu.toL2Bus.port[2]
mem_side=system.membus.port[1]
[system.cpu.toL2Bus]
type=Bus
block_size=64
bus_id=0
clock=1000
responder_set=false
width=64
port=system.cpu.icache.mem_side system.cpu.dcache.mem_side system.cpu.l2cache.cpu_side
[system.cpu.workload]
type=LiveProcess
cmd=gzip input.log 1
cwd=build/SPARC_SE/tests/fast/long/00.gzip/sparc/linux/o3-timing
egid=100
env=
euid=100
executable=/dist/m5/cpu2000/binaries/sparc/linux/gzip
gid=100
input=cin
output=cout
pid=100
ppid=99
system=system
uid=100
[system.membus]
type=Bus
block_size=64
bus_id=0
clock=1000
responder_set=false
width=64
port=system.physmem.port[0] system.cpu.l2cache.mem_side
[system.physmem]
type=PhysicalMemory
file=
latency=1
range=0:134217727
zero=false
port=system.membus.port[0]

View file

@ -0,0 +1,366 @@
[root]
type=Root
dummy=0
[system.physmem]
type=PhysicalMemory
file=
range=[0,134217727]
latency=1
zero=false
[system]
type=System
physmem=system.physmem
mem_mode=atomic
[system.membus]
type=Bus
bus_id=0
clock=1000
width=64
responder_set=false
block_size=64
[system.cpu.workload]
type=LiveProcess
cmd=gzip input.log 1
executable=/dist/m5/cpu2000/binaries/sparc/linux/gzip
input=cin
output=cout
env=
cwd=build/SPARC_SE/tests/fast/long/00.gzip/sparc/linux/o3-timing
system=system
uid=100
euid=100
gid=100
egid=100
pid=100
ppid=99
[system.cpu.fuPool.FUList0.opList0]
type=OpDesc
opClass=IntAlu
opLat=1
issueLat=1
[system.cpu.fuPool.FUList0]
type=FUDesc
opList=system.cpu.fuPool.FUList0.opList0
count=6
[system.cpu.fuPool.FUList1.opList0]
type=OpDesc
opClass=IntMult
opLat=3
issueLat=1
[system.cpu.fuPool.FUList1.opList1]
type=OpDesc
opClass=IntDiv
opLat=20
issueLat=19
[system.cpu.fuPool.FUList1]
type=FUDesc
opList=system.cpu.fuPool.FUList1.opList0 system.cpu.fuPool.FUList1.opList1
count=2
[system.cpu.fuPool.FUList2.opList0]
type=OpDesc
opClass=FloatAdd
opLat=2
issueLat=1
[system.cpu.fuPool.FUList2.opList1]
type=OpDesc
opClass=FloatCmp
opLat=2
issueLat=1
[system.cpu.fuPool.FUList2.opList2]
type=OpDesc
opClass=FloatCvt
opLat=2
issueLat=1
[system.cpu.fuPool.FUList2]
type=FUDesc
opList=system.cpu.fuPool.FUList2.opList0 system.cpu.fuPool.FUList2.opList1 system.cpu.fuPool.FUList2.opList2
count=4
[system.cpu.fuPool.FUList3.opList0]
type=OpDesc
opClass=FloatMult
opLat=4
issueLat=1
[system.cpu.fuPool.FUList3.opList1]
type=OpDesc
opClass=FloatDiv
opLat=12
issueLat=12
[system.cpu.fuPool.FUList3.opList2]
type=OpDesc
opClass=FloatSqrt
opLat=24
issueLat=24
[system.cpu.fuPool.FUList3]
type=FUDesc
opList=system.cpu.fuPool.FUList3.opList0 system.cpu.fuPool.FUList3.opList1 system.cpu.fuPool.FUList3.opList2
count=2
[system.cpu.fuPool.FUList4.opList0]
type=OpDesc
opClass=MemRead
opLat=1
issueLat=1
[system.cpu.fuPool.FUList4]
type=FUDesc
opList=system.cpu.fuPool.FUList4.opList0
count=0
[system.cpu.fuPool.FUList5.opList0]
type=OpDesc
opClass=MemWrite
opLat=1
issueLat=1
[system.cpu.fuPool.FUList5]
type=FUDesc
opList=system.cpu.fuPool.FUList5.opList0
count=0
[system.cpu.fuPool.FUList6.opList0]
type=OpDesc
opClass=MemRead
opLat=1
issueLat=1
[system.cpu.fuPool.FUList6.opList1]
type=OpDesc
opClass=MemWrite
opLat=1
issueLat=1
[system.cpu.fuPool.FUList6]
type=FUDesc
opList=system.cpu.fuPool.FUList6.opList0 system.cpu.fuPool.FUList6.opList1
count=4
[system.cpu.fuPool.FUList7.opList0]
type=OpDesc
opClass=IprAccess
opLat=3
issueLat=3
[system.cpu.fuPool.FUList7]
type=FUDesc
opList=system.cpu.fuPool.FUList7.opList0
count=1
[system.cpu.fuPool]
type=FUPool
FUList=system.cpu.fuPool.FUList0 system.cpu.fuPool.FUList1 system.cpu.fuPool.FUList2 system.cpu.fuPool.FUList3 system.cpu.fuPool.FUList4 system.cpu.fuPool.FUList5 system.cpu.fuPool.FUList6 system.cpu.fuPool.FUList7
[system.cpu]
type=DerivO3CPU
clock=500
phase=0
numThreads=1
cpu_id=0
activity=0
workload=system.cpu.workload
checker=null
max_insts_any_thread=0
max_insts_all_threads=0
max_loads_any_thread=0
max_loads_all_threads=0
progress_interval=0
cachePorts=200
decodeToFetchDelay=1
renameToFetchDelay=1
iewToFetchDelay=1
commitToFetchDelay=1
fetchWidth=8
renameToDecodeDelay=1
iewToDecodeDelay=1
commitToDecodeDelay=1
fetchToDecodeDelay=1
decodeWidth=8
iewToRenameDelay=1
commitToRenameDelay=1
decodeToRenameDelay=1
renameWidth=8
commitToIEWDelay=1
renameToIEWDelay=2
issueToExecuteDelay=1
dispatchWidth=8
issueWidth=8
wbWidth=8
wbDepth=1
fuPool=system.cpu.fuPool
iewToCommitDelay=1
renameToROBDelay=1
commitWidth=8
squashWidth=8
trapLatency=13
backComSize=5
forwardComSize=5
predType=tournament
localPredictorSize=2048
localCtrBits=2
localHistoryTableSize=2048
localHistoryBits=11
globalPredictorSize=8192
globalCtrBits=2
globalHistoryBits=13
choicePredictorSize=8192
choiceCtrBits=2
BTBEntries=4096
BTBTagSize=16
RASSize=16
LQEntries=32
SQEntries=32
LFSTSize=1024
SSITSize=1024
numPhysIntRegs=256
numPhysFloatRegs=256
numIQEntries=64
numROBEntries=192
smtNumFetchingThreads=1
smtFetchPolicy=SingleThread
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtIQPolicy=Partitioned
smtIQThreshold=100
smtROBPolicy=Partitioned
smtROBThreshold=100
smtCommitPolicy=RoundRobin
instShiftAmt=2
defer_registration=false
function_trace=false
function_trace_start=0
[system.cpu.icache]
type=BaseCache
size=131072
assoc=2
block_size=64
latency=1000
mshrs=10
tgts_per_mshr=20
write_buffers=8
prioritizeRequests=false
protocol=null
trace_addr=0
hash_delay=1
repl=null
compressed_bus=false
store_compressed=false
adaptive_compression=false
compression_latency=0
block_size=64
max_miss_count=0
addr_range=[0,18446744073709551615]
split=false
split_size=0
lifo=false
two_queue=false
prefetch_miss=false
prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
prefetch_use_cpu_id=true
prefetch_data_accesses_only=false
[system.cpu.dcache]
type=BaseCache
size=262144
assoc=2
block_size=64
latency=1000
mshrs=10
tgts_per_mshr=20
write_buffers=8
prioritizeRequests=false
protocol=null
trace_addr=0
hash_delay=1
repl=null
compressed_bus=false
store_compressed=false
adaptive_compression=false
compression_latency=0
block_size=64
max_miss_count=0
addr_range=[0,18446744073709551615]
split=false
split_size=0
lifo=false
two_queue=false
prefetch_miss=false
prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
prefetch_use_cpu_id=true
prefetch_data_accesses_only=false
[system.cpu.l2cache]
type=BaseCache
size=2097152
assoc=2
block_size=64
latency=1000
mshrs=10
tgts_per_mshr=5
write_buffers=8
prioritizeRequests=false
protocol=null
trace_addr=0
hash_delay=1
repl=null
compressed_bus=false
store_compressed=false
adaptive_compression=false
compression_latency=0
block_size=64
max_miss_count=0
addr_range=[0,18446744073709551615]
split=false
split_size=0
lifo=false
two_queue=false
prefetch_miss=false
prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
prefetch_use_cpu_id=true
prefetch_data_accesses_only=false
[system.cpu.toL2Bus]
type=Bus
bus_id=0
clock=1000
width=64
responder_set=false
block_size=64

View file

@ -0,0 +1,423 @@
---------- Begin Simulation Statistics ----------
global.BPredUnit.BTBCorrect 0 # Number of correct BTB predictions (this stat may not work properly.
global.BPredUnit.BTBHits 155497873 # Number of BTB hits
global.BPredUnit.BTBLookups 176569029 # Number of BTB lookups
global.BPredUnit.RASInCorrect 0 # Number of incorrect RAS predictions.
global.BPredUnit.condIncorrect 90327270 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 223339092 # Number of conditional branches predicted
global.BPredUnit.lookups 223339092 # Number of BP lookups
global.BPredUnit.usedRAS 0 # Number of times the RAS was used to get a target.
host_inst_rate 54106 # Simulator instruction rate (inst/s)
host_mem_usage 156124 # Number of bytes of host memory used
host_seconds 27529.37 # Real time elapsed on the host
host_tick_rate 45674334 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 464625781 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 155659586 # Number of conflicting stores.
memdepunit.memDep.insertedLoads 751805606 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 305482201 # Number of stores inserted to the mem dependence unit.
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 1489514762 # Number of instructions simulated
sim_seconds 1.257386 # Number of seconds simulated
sim_ticks 1257385552000 # Number of ticks simulated
system.cpu.commit.COM:branches 86246390 # Number of branches committed
system.cpu.commit.COM:bw_lim_events 9313657 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_limited 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:committed_per_cycle.start_dist # Number of insts commited each cycle
system.cpu.commit.COM:committed_per_cycle.samples 2273477268
system.cpu.commit.COM:committed_per_cycle.min_value 0
0 1413600532 6217.79%
1 557883273 2453.88%
2 123364539 542.62%
3 120963543 532.06%
4 18884040 83.06%
5 12171132 53.54%
6 9965158 43.83%
7 7331394 32.25%
8 9313657 40.97%
system.cpu.commit.COM:committed_per_cycle.max_value 8
system.cpu.commit.COM:committed_per_cycle.end_dist
system.cpu.commit.COM:count 1489514762 # Number of instructions committed
system.cpu.commit.COM:loads 402511689 # Number of loads committed
system.cpu.commit.COM:membars 51356 # Number of memory barriers committed
system.cpu.commit.COM:refs 569359657 # Number of memory references committed
system.cpu.commit.COM:swp_count 0 # Number of s/w prefetches committed
system.cpu.commit.branchMispredicts 90327270 # The number of times a branch was mispredicted
system.cpu.commit.commitCommittedInsts 1489514762 # The number of committed instructions
system.cpu.commit.commitNonSpecStalls 2243499 # The number of times commit has been forced to stall to communicate backwards
system.cpu.commit.commitSquashedInsts 1399513618 # The number of squashed insts skipped by commit
system.cpu.committedInsts 1489514762 # Number of Instructions Simulated
system.cpu.committedInsts_total 1489514762 # Number of Instructions Simulated
system.cpu.cpi 1.688316 # CPI: Cycles Per Instruction
system.cpu.cpi_total 1.688316 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 431095835 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 2842.252413 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 2392.500580 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 430168385 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 2636047000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.002151 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 927450 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 694672 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 556921500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.000540 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 232778 # number of ReadReq MSHR misses
system.cpu.dcache.SwapReq_accesses 1326 # number of SwapReq accesses(hits+misses)
system.cpu.dcache.SwapReq_avg_miss_latency 3500 # average SwapReq miss latency
system.cpu.dcache.SwapReq_avg_mshr_miss_latency 2500 # average SwapReq mshr miss latency
system.cpu.dcache.SwapReq_hits 1319 # number of SwapReq hits
system.cpu.dcache.SwapReq_miss_latency 24500 # number of SwapReq miss cycles
system.cpu.dcache.SwapReq_miss_rate 0.005279 # miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_misses 7 # number of SwapReq misses
system.cpu.dcache.SwapReq_mshr_miss_latency 17500 # number of SwapReq MSHR miss cycles
system.cpu.dcache.SwapReq_mshr_miss_rate 0.005279 # mshr miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_mshr_misses 7 # number of SwapReq MSHR misses
system.cpu.dcache.WriteReq_accesses 166846642 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency 3889.592412 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency 3171.120393 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 165155866 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 6576429500 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.010134 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 1690776 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 1420478 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_miss_latency 857147500 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_rate 0.001620 # mshr miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_mshr_misses 270298 # number of WriteReq MSHR misses
system.cpu.dcache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_refs 1183.354576 # Average number of references to valid blocks.
system.cpu.dcache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 597942477 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 3518.594842 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 2810.845677 # average overall mshr miss latency
system.cpu.dcache.demand_hits 595324251 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 9212476500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.004379 # miss rate for demand accesses
system.cpu.dcache.demand_misses 2618226 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 2115150 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 1414069000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.000841 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 503076 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 597942477 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 3518.594842 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 2810.845677 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 595324251 # number of overall hits
system.cpu.dcache.overall_miss_latency 9212476500 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.004379 # miss rate for overall accesses
system.cpu.dcache.overall_misses 2618226 # number of overall misses
system.cpu.dcache.overall_mshr_hits 2115150 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 1414069000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.000841 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 503076 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.dcache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.dcache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
system.cpu.dcache.prefetcher.num_hwpf_already_in_mshr 0 # number of hwpf that were already in mshr
system.cpu.dcache.prefetcher.num_hwpf_already_in_prefetcher 0 # number of hwpf that were already in the prefetch queue
system.cpu.dcache.prefetcher.num_hwpf_evicted 0 # number of hwpf removed due to no buffer left
system.cpu.dcache.prefetcher.num_hwpf_identified 0 # number of hwpf identified
system.cpu.dcache.prefetcher.num_hwpf_issued 0 # number of hwpf issued
system.cpu.dcache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.dcache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.dcache.replacements 498987 # number of replacements
system.cpu.dcache.sampled_refs 503083 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 4095.797134 # Cycle average of tags in use
system.cpu.dcache.total_refs 595325570 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 77974000 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 335737 # number of writebacks
system.cpu.decode.DECODE:BlockedCycles 435745843 # Number of cycles decode is blocked
system.cpu.decode.DECODE:DecodedInsts 3276032607 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 1073744654 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 761619600 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 241293837 # Number of cycles decode is squashing
system.cpu.decode.DECODE:UnblockCycles 2367171 # Number of cycles decode is unblocking
system.cpu.fetch.Branches 223339092 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 355860305 # Number of cache lines fetched
system.cpu.fetch.Cycles 1166695920 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 14770227 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 3591774268 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 93734364 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.088811 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 355860305 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 155497873 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.428271 # Number of inst fetches per cycle
system.cpu.fetch.rateDist.start_dist # Number of instructions fetched each cycle (Total)
system.cpu.fetch.rateDist.samples 2514771105
system.cpu.fetch.rateDist.min_value 0
0 1703935491 6775.71%
1 252157679 1002.71%
2 75632424 300.75%
3 38096592 151.49%
4 76680653 304.92%
5 30840750 122.64%
6 33076966 131.53%
7 20130593 80.05%
8 284219957 1130.20%
system.cpu.fetch.rateDist.max_value 8
system.cpu.fetch.rateDist.end_dist
system.cpu.icache.ReadReq_accesses 355860305 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5111.111111 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4198.640483 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 355858946 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 6946000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.000004 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 1359 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 35 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 5559000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.000004 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 1324 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_refs 268775.638973 # Average number of references to valid blocks.
system.cpu.icache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 355860305 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5111.111111 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4198.640483 # average overall mshr miss latency
system.cpu.icache.demand_hits 355858946 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 6946000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.000004 # miss rate for demand accesses
system.cpu.icache.demand_misses 1359 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 35 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 5559000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.000004 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 1324 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 355860305 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5111.111111 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4198.640483 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 355858946 # number of overall hits
system.cpu.icache.overall_miss_latency 6946000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.000004 # miss rate for overall accesses
system.cpu.icache.overall_misses 1359 # number of overall misses
system.cpu.icache.overall_mshr_hits 35 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 5559000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.000004 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 1324 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.icache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.icache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
system.cpu.icache.prefetcher.num_hwpf_already_in_mshr 0 # number of hwpf that were already in mshr
system.cpu.icache.prefetcher.num_hwpf_already_in_prefetcher 0 # number of hwpf that were already in the prefetch queue
system.cpu.icache.prefetcher.num_hwpf_evicted 0 # number of hwpf removed due to no buffer left
system.cpu.icache.prefetcher.num_hwpf_identified 0 # number of hwpf identified
system.cpu.icache.prefetcher.num_hwpf_issued 0 # number of hwpf issued
system.cpu.icache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.icache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.icache.replacements 198 # number of replacements
system.cpu.icache.sampled_refs 1324 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 1026.431065 # Cycle average of tags in use
system.cpu.icache.total_refs 355858946 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.idleCycles 1497 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 128998684 # Number of branches executed
system.cpu.iew.EXEC:nop 0 # number of nop insts executed
system.cpu.iew.EXEC:rate 0.879999 # Inst execution rate
system.cpu.iew.EXEC:refs 756340485 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 208683785 # Number of stores executed
system.cpu.iew.EXEC:swp 0 # number of swp insts executed
system.cpu.iew.WB:consumers 1511846593 # num instructions consuming a value
system.cpu.iew.WB:count 2184193190 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 0.964010 # average fanout of values written-back
system.cpu.iew.WB:penalized 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_rate 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:producers 1457435157 # num instructions producing a value
system.cpu.iew.WB:rate 0.868546 # insts written-back per cycle
system.cpu.iew.WB:sent 2194556483 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 93921260 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 242324 # Number of cycles IEW is blocking
system.cpu.iew.iewDispLoadInsts 751805606 # Number of dispatched load instructions
system.cpu.iew.iewDispNonSpecInsts 21112863 # Number of dispatched non-speculative instructions
system.cpu.iew.iewDispSquashedInsts 6967923 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 305482201 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 2889028359 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 547656700 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 155922171 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 2212995141 # Number of executed instructions
system.cpu.iew.iewIQFullEvents 0 # Number of times the IQ has become full, causing a stall
system.cpu.iew.iewIdleCycles 0 # Number of cycles IEW is idle
system.cpu.iew.iewLSQFullEvents 0 # Number of times the LSQ has become full, causing a stall
system.cpu.iew.iewSquashCycles 241293837 # Number of cycles IEW is squashing
system.cpu.iew.iewUnblockCycles 1173 # Number of cycles IEW is unblocking
system.cpu.iew.lsq.thread.0.blockedLoads 0 # Number of blocked loads due to partial load-store forwarding
system.cpu.iew.lsq.thread.0.cacheBlocked 0 # Number of times an access to memory failed due to the cache being blocked
system.cpu.iew.lsq.thread.0.forwLoads 116560202 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.0.ignoredResponses 586068 # Number of memory responses ignored because the instruction is squashed
system.cpu.iew.lsq.thread.0.invAddrLoads 0 # Number of loads ignored due to an invalid address
system.cpu.iew.lsq.thread.0.invAddrSwpfs 0 # Number of software prefetches ignored due to an invalid address
system.cpu.iew.lsq.thread.0.memOrderViolation 3827981 # Number of memory ordering violations
system.cpu.iew.lsq.thread.0.rescheduledLoads 59 # Number of loads that were rescheduled
system.cpu.iew.lsq.thread.0.squashedLoads 349293917 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 138634233 # Number of stores squashed
system.cpu.iew.memOrderViolationEvents 3827981 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 1127857 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 92793403 # Number of branches that were predicted taken incorrectly
system.cpu.ipc 0.592306 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.592306 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 2368917312 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.start_dist
No_OpClass 351375247 14.83% # Type of FU issued
IntAlu 1188705257 50.18% # Type of FU issued
IntMult 0 0.00% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 2951238 0.12% # Type of FU issued
FloatCmp 0 0.00% # Type of FU issued
FloatCvt 0 0.00% # Type of FU issued
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 592531661 25.01% # Type of FU issued
MemWrite 233353909 9.85% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.end_dist
system.cpu.iq.ISSUE:fu_busy_cnt 6622922 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.002796 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_full.start_dist
No_OpClass 0 0.00% # attempts to use FU when none available
IntAlu 3150287 47.57% # attempts to use FU when none available
IntMult 0 0.00% # attempts to use FU when none available
IntDiv 0 0.00% # attempts to use FU when none available
FloatAdd 202242 3.05% # attempts to use FU when none available
FloatCmp 0 0.00% # attempts to use FU when none available
FloatCvt 0 0.00% # attempts to use FU when none available
FloatMult 0 0.00% # attempts to use FU when none available
FloatDiv 0 0.00% # attempts to use FU when none available
FloatSqrt 0 0.00% # attempts to use FU when none available
MemRead 2975364 44.93% # attempts to use FU when none available
MemWrite 295029 4.45% # attempts to use FU when none available
IprAccess 0 0.00% # attempts to use FU when none available
InstPrefetch 0 0.00% # attempts to use FU when none available
system.cpu.iq.ISSUE:fu_full.end_dist
system.cpu.iq.ISSUE:issued_per_cycle.start_dist # Number of insts issued each cycle
system.cpu.iq.ISSUE:issued_per_cycle.samples 2514771105
system.cpu.iq.ISSUE:issued_per_cycle.min_value 0
0 1264571415 5028.57%
1 618163663 2458.13%
2 318214573 1265.38%
3 195947630 779.19%
4 78232851 311.09%
5 28085074 111.68%
6 8167595 32.48%
7 2987163 11.88%
8 401141 1.60%
system.cpu.iq.ISSUE:issued_per_cycle.max_value 8
system.cpu.iq.ISSUE:issued_per_cycle.end_dist
system.cpu.iq.ISSUE:rate 0.942001 # Inst issue rate
system.cpu.iq.iqInstsAdded 2867645475 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 2368917312 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 21382884 # Number of non-speculative instructions added to the IQ
system.cpu.iq.iqSquashedInstsExamined 1368214032 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 461256 # Number of squashed instructions issued
system.cpu.iq.iqSquashedNonSpecRemoved 19139385 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 1296493196 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 504406 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 4393.799833 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2267.430007 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_hits 476939 # number of ReadReq hits
system.cpu.l2cache.ReadReq_miss_latency 120684500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 0.054454 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 27467 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 62279500 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate 0.054454 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 27467 # number of ReadReq MSHR misses
system.cpu.l2cache.Writeback_accesses 335737 # number of Writeback accesses(hits+misses)
system.cpu.l2cache.Writeback_hits 335720 # number of Writeback hits
system.cpu.l2cache.Writeback_miss_rate 0.000051 # miss rate for Writeback accesses
system.cpu.l2cache.Writeback_misses 17 # number of Writeback misses
system.cpu.l2cache.Writeback_mshr_miss_rate 0.000051 # mshr miss rate for Writeback accesses
system.cpu.l2cache.Writeback_mshr_misses 17 # number of Writeback MSHR misses
system.cpu.l2cache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_refs 29.586740 # Average number of references to valid blocks.
system.cpu.l2cache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 504406 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 4393.799833 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2267.430007 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 476939 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 120684500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 0.054454 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 27467 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_miss_latency 62279500 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate 0.054454 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 27467 # number of demand (read+write) MSHR misses
system.cpu.l2cache.fast_writes 0 # number of fast writes performed
system.cpu.l2cache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 840143 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 4391.082084 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2267.430007 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_hits 812659 # number of overall hits
system.cpu.l2cache.overall_miss_latency 120684500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 0.032713 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 27484 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_miss_latency 62279500 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate 0.032693 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 27467 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.l2cache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.l2cache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
system.cpu.l2cache.prefetcher.num_hwpf_already_in_mshr 0 # number of hwpf that were already in mshr
system.cpu.l2cache.prefetcher.num_hwpf_already_in_prefetcher 0 # number of hwpf that were already in the prefetch queue
system.cpu.l2cache.prefetcher.num_hwpf_evicted 0 # number of hwpf removed due to no buffer left
system.cpu.l2cache.prefetcher.num_hwpf_identified 0 # number of hwpf identified
system.cpu.l2cache.prefetcher.num_hwpf_issued 0 # number of hwpf issued
system.cpu.l2cache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.l2cache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.l2cache.replacements 2692 # number of replacements
system.cpu.l2cache.sampled_refs 27467 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 24466.224839 # Cycle average of tags in use
system.cpu.l2cache.total_refs 812659 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 2555 # number of writebacks
system.cpu.numCycles 2514771105 # number of cpu cycles simulated
system.cpu.rename.RENAME:BlockCycles 14153952 # Number of cycles rename is blocking
system.cpu.rename.RENAME:CommittedMaps 1244762263 # Number of HB maps that are committed
system.cpu.rename.RENAME:IQFullEvents 845 # Number of times rename has blocked due to IQ full
system.cpu.rename.RENAME:IdleCycles 1122858502 # Number of cycles rename is idle
system.cpu.rename.RENAME:LSQFullEvents 18964355 # Number of times rename has blocked due to LSQ full
system.cpu.rename.RENAME:RenameLookups 4974059876 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 3105364972 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 2435580679 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 713636177 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 241293837 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 24303898 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 1190818416 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 398524739 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:serializingInsts 21495577 # count of serializing insts renamed
system.cpu.rename.RENAME:skidInsts 149561373 # count of insts added to the skid buffer
system.cpu.rename.RENAME:tempSerializingInsts 21338548 # count of temporary serializing insts renamed
system.cpu.timesIdled 3 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.workload.PROG:num_syscalls 19 # Number of system calls
---------- End Simulation Statistics ----------

View file

@ -0,0 +1,6 @@
warn: More than two loadable segments in ELF object.
warn: Ignoring segment @ 0xb4000 length 0x10.
warn: More than two loadable segments in ELF object.
warn: Ignoring segment @ 0x0 length 0x0.
warn: Entering event queue @ 0. Starting simulation...
warn: Ignoring request to flush register windows.

View file

@ -0,0 +1,44 @@
spec_init
Loading Input Data
Duplicating 262144 bytes
Duplicating 524288 bytes
Input data 1048576 bytes in length
Compressing Input Data, level 1
Compressed data 108074 bytes in length
Uncompressing Data
Uncompressed data 1048576 bytes in length
Uncompressed data compared correctly
Compressing Input Data, level 3
Compressed data 97831 bytes in length
Uncompressing Data
Uncompressed data 1048576 bytes in length
Uncompressed data compared correctly
Compressing Input Data, level 5
Compressed data 83382 bytes in length
Uncompressing Data
Uncompressed data 1048576 bytes in length
Uncompressed data compared correctly
Compressing Input Data, level 7
Compressed data 76606 bytes in length
Uncompressing Data
Uncompressed data 1048576 bytes in length
Uncompressed data compared correctly
Compressing Input Data, level 9
Compressed data 73189 bytes in length
Uncompressing Data
Uncompressed data 1048576 bytes in length
Uncompressed data compared correctly
Tested 1MB buffer: OK!
M5 Simulator System
Copyright (c) 2001-2006
The Regents of The University of Michigan
All Rights Reserved
M5 compiled Jun 21 2007 21:15:48
M5 started Fri Jun 22 01:01:27 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/SPARC_SE/m5.fast -d build/SPARC_SE/tests/fast/long/00.gzip/sparc/linux/o3-timing tests/run.py long/00.gzip/sparc/linux/o3-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 1257385552000 because target called exit()

View file

@ -39,7 +39,7 @@ env=
euid=100
executable=/dist/m5/cpu2000/binaries/sparc/linux/mcf
gid=100
input=/dist/m5/cpu2000/data/mcf/lgred/input/mcf.in
input=/dist/m5/cpu2000/data/mcf/smred/input/mcf.in
output=cout
pid=100
ppid=99
@ -53,7 +53,7 @@ bus_id=0
clock=1000
responder_set=false
width=64
port=system.physmem.port system.cpu.icache_port system.cpu.dcache_port
port=system.physmem.port[0] system.cpu.icache_port system.cpu.dcache_port
[system.physmem]
type=PhysicalMemory

View file

@ -26,7 +26,7 @@ block_size=64
type=LiveProcess
cmd=mcf mcf.in
executable=/dist/m5/cpu2000/binaries/sparc/linux/mcf
input=/dist/m5/cpu2000/data/mcf/lgred/input/mcf.in
input=/dist/m5/cpu2000/data/mcf/smred/input/mcf.in
output=cout
env=
cwd=build/SPARC_SE/tests/fast/long/10.mcf/sparc/linux/simple-atomic

View file

@ -1,18 +1,18 @@
---------- Begin Simulation Statistics ----------
host_inst_rate 686638 # Simulator instruction rate (inst/s)
host_mem_usage 149820 # Number of bytes of host memory used
host_seconds 2504.37 # Real time elapsed on the host
host_tick_rate 343319148 # Simulator tick rate (ticks/s)
host_inst_rate 1151751 # Simulator instruction rate (inst/s)
host_mem_usage 150484 # Number of bytes of host memory used
host_seconds 211.71 # Real time elapsed on the host
host_tick_rate 575874246 # Simulator tick rate (ticks/s)
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 1719594534 # Number of instructions simulated
sim_seconds 0.859797 # Number of seconds simulated
sim_ticks 859797266500 # Number of ticks simulated
sim_insts 243840172 # Number of instructions simulated
sim_seconds 0.121920 # Number of seconds simulated
sim_ticks 121920085500 # Number of ticks simulated
system.cpu.idle_fraction 0 # Percentage of idle cycles
system.cpu.not_idle_fraction 1 # Percentage of non-idle cycles
system.cpu.numCycles 1719594534 # number of cpu cycles simulated
system.cpu.num_insts 1719594534 # Number of instructions executed
system.cpu.num_refs 774793634 # Number of memory references
system.cpu.workload.PROG:num_syscalls 632 # Number of system calls
system.cpu.numCycles 243840172 # number of cpu cycles simulated
system.cpu.num_insts 243840172 # Number of instructions executed
system.cpu.num_refs 105125191 # Number of memory references
system.cpu.workload.PROG:num_syscalls 428 # Number of system calls
---------- End Simulation Statistics ----------

File diff suppressed because it is too large Load diff

View file

@ -4,19 +4,15 @@ by Andreas Loebel
Copyright (c) 1998,1999 ZIB Berlin
All Rights Reserved.
nodes : 1800
active arcs : 8190
simplex iterations : 6837
flow value : 12860044181
new implicit arcs : 300000
active arcs : 308190
simplex iterations : 11843
flow value : 9360043604
new implicit arcs : 22787
active arcs : 330977
simplex iterations : 11931
flow value : 9360043512
checksum : 798014
nodes : 500
active arcs : 1905
simplex iterations : 1502
flow value : 4990014995
new implicit arcs : 23867
active arcs : 25772
simplex iterations : 2663
flow value : 3080014995
checksum : 68389
optimal
M5 Simulator System
@ -25,9 +21,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled May 15 2007 13:02:31
M5 started Tue May 15 14:23:47 2007
M5 compiled Jun 21 2007 21:15:48
M5 started Fri Jun 22 01:58:18 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/SPARC_SE/m5.fast -d build/SPARC_SE/tests/fast/long/10.mcf/sparc/linux/simple-atomic tests/run.py long/10.mcf/sparc/linux/simple-atomic
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 859797266500 because target called exit()
Exiting @ tick 121920085500 because target called exit()

View file

@ -31,6 +31,7 @@ icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -44,7 +45,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -69,6 +70,7 @@ mem_side=system.cpu.toL2Bus.port[1]
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -82,7 +84,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -107,6 +109,7 @@ mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -120,7 +123,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=100000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -160,7 +163,7 @@ env=
euid=100
executable=/dist/m5/cpu2000/binaries/sparc/linux/mcf
gid=100
input=/dist/m5/cpu2000/data/mcf/lgred/input/mcf.in
input=/dist/m5/cpu2000/data/mcf/smred/input/mcf.in
output=cout
pid=100
ppid=99
@ -174,7 +177,7 @@ bus_id=0
clock=1000
responder_set=false
width=64
port=system.physmem.port system.cpu.l2cache.mem_side
port=system.physmem.port[0] system.cpu.l2cache.mem_side
[system.physmem]
type=PhysicalMemory

View file

@ -26,7 +26,7 @@ block_size=64
type=LiveProcess
cmd=mcf mcf.in
executable=/dist/m5/cpu2000/binaries/sparc/linux/mcf
input=/dist/m5/cpu2000/data/mcf/lgred/input/mcf.in
input=/dist/m5/cpu2000/data/mcf/smred/input/mcf.in
output=cout
env=
cwd=build/SPARC_SE/tests/fast/long/10.mcf/sparc/linux/simple-timing
@ -94,7 +94,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
@ -131,7 +131,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
@ -168,7 +168,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=100000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true

View file

@ -1,77 +1,77 @@
---------- Begin Simulation Statistics ----------
host_inst_rate 480485 # Simulator instruction rate (inst/s)
host_mem_usage 155316 # Number of bytes of host memory used
host_seconds 3578.87 # Real time elapsed on the host
host_tick_rate 745845171 # Simulator tick rate (ticks/s)
host_inst_rate 697152 # Simulator instruction rate (inst/s)
host_mem_usage 155896 # Number of bytes of host memory used
host_seconds 349.77 # Real time elapsed on the host
host_tick_rate 1027373651 # Simulator tick rate (ticks/s)
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 1719594534 # Number of instructions simulated
sim_seconds 2.669285 # Number of seconds simulated
sim_ticks 2669284585000 # Number of ticks simulated
system.cpu.dcache.ReadReq_accesses 607807189 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 12893.226605 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 11893.226605 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 594739458 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 168485217000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.021500 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 13067731 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_miss_latency 155417486000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.021500 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 13067731 # number of ReadReq MSHR misses
system.cpu.dcache.SwapReq_accesses 15448 # number of SwapReq accesses(hits+misses)
system.cpu.dcache.SwapReq_avg_miss_latency 13090.909091 # average SwapReq miss latency
system.cpu.dcache.SwapReq_avg_mshr_miss_latency 12090.909091 # average SwapReq mshr miss latency
system.cpu.dcache.SwapReq_hits 15437 # number of SwapReq hits
system.cpu.dcache.SwapReq_miss_latency 144000 # number of SwapReq miss cycles
system.cpu.dcache.SwapReq_miss_rate 0.000712 # miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_misses 11 # number of SwapReq misses
system.cpu.dcache.SwapReq_mshr_miss_latency 133000 # number of SwapReq MSHR miss cycles
system.cpu.dcache.SwapReq_mshr_miss_rate 0.000712 # mshr miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_mshr_misses 11 # number of SwapReq MSHR misses
system.cpu.dcache.WriteReq_accesses 166970997 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency 12404.292450 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency 11404.292450 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 165264000 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 21174090000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.010223 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 1706997 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_miss_latency 19467093000 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_rate 0.010223 # mshr miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_mshr_misses 1706997 # number of WriteReq MSHR misses
sim_insts 243840172 # Number of instructions simulated
sim_seconds 0.359341 # Number of seconds simulated
sim_ticks 359340764000 # Number of ticks simulated
system.cpu.dcache.ReadReq_accesses 82219469 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 12000.343864 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 11000.343864 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 81326673 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 10713859000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.010859 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 892796 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_miss_latency 9821063000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.010859 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 892796 # number of ReadReq MSHR misses
system.cpu.dcache.SwapReq_accesses 3886 # number of SwapReq accesses(hits+misses)
system.cpu.dcache.SwapReq_avg_miss_latency 12500 # average SwapReq miss latency
system.cpu.dcache.SwapReq_avg_mshr_miss_latency 11500 # average SwapReq mshr miss latency
system.cpu.dcache.SwapReq_hits 3882 # number of SwapReq hits
system.cpu.dcache.SwapReq_miss_latency 50000 # number of SwapReq miss cycles
system.cpu.dcache.SwapReq_miss_rate 0.001029 # miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_misses 4 # number of SwapReq misses
system.cpu.dcache.SwapReq_mshr_miss_latency 46000 # number of SwapReq MSHR miss cycles
system.cpu.dcache.SwapReq_mshr_miss_rate 0.001029 # mshr miss rate for SwapReq accesses
system.cpu.dcache.SwapReq_mshr_misses 4 # number of SwapReq MSHR misses
system.cpu.dcache.WriteReq_accesses 22901836 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency 12623.899964 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency 11623.899964 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 22855133 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 589574000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.002039 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 46703 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_miss_latency 542871000 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_rate 0.002039 # mshr miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_mshr_misses 46703 # number of WriteReq MSHR misses
system.cpu.dcache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_refs 51.440428 # Average number of references to valid blocks.
system.cpu.dcache.avg_refs 110.894471 # Average number of references to valid blocks.
system.cpu.dcache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 774778186 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 12836.737637 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 11836.737637 # average overall mshr miss latency
system.cpu.dcache.demand_hits 760003458 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 189659307000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.019070 # miss rate for demand accesses
system.cpu.dcache.demand_misses 14774728 # number of demand (read+write) misses
system.cpu.dcache.demand_accesses 105121305 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 12031.341172 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 11031.341172 # average overall mshr miss latency
system.cpu.dcache.demand_hits 104181806 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 11303433000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.008937 # miss rate for demand accesses
system.cpu.dcache.demand_misses 939499 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 174884579000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.019070 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 14774728 # number of demand (read+write) MSHR misses
system.cpu.dcache.demand_mshr_miss_latency 10363934000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.008937 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 939499 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 774778186 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 12836.737637 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 11836.737637 # average overall mshr miss latency
system.cpu.dcache.overall_accesses 105121305 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 12031.341172 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 11031.341172 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 760003458 # number of overall hits
system.cpu.dcache.overall_miss_latency 189659307000 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.019070 # miss rate for overall accesses
system.cpu.dcache.overall_misses 14774728 # number of overall misses
system.cpu.dcache.overall_hits 104181806 # number of overall hits
system.cpu.dcache.overall_miss_latency 11303433000 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.008937 # miss rate for overall accesses
system.cpu.dcache.overall_misses 939499 # number of overall misses
system.cpu.dcache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 174884579000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.019070 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 14774728 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_miss_latency 10363934000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.008937 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 939499 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.dcache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.dcache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
@ -83,57 +83,57 @@ system.cpu.dcache.prefetcher.num_hwpf_issued 0
system.cpu.dcache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.dcache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.dcache.replacements 14770643 # number of replacements
system.cpu.dcache.sampled_refs 14774739 # Sample count of references to valid blocks.
system.cpu.dcache.replacements 935407 # number of replacements
system.cpu.dcache.sampled_refs 939503 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 4094.628585 # Cycle average of tags in use
system.cpu.dcache.total_refs 760018895 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 3913237000 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 4191356 # number of writebacks
system.cpu.icache.ReadReq_accesses 1719594535 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 13991.120977 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 12991.120977 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 1719593634 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 12606000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.000001 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 901 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_miss_latency 11705000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.000001 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 901 # number of ReadReq MSHR misses
system.cpu.dcache.tagsinuse 3560.887601 # Cycle average of tags in use
system.cpu.dcache.total_refs 104185688 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 134116230000 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 94807 # number of writebacks
system.cpu.icache.ReadReq_accesses 243840173 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 13993.174061 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 12993.174061 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 243839294 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 12300000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.000004 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 879 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_miss_latency 11421000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.000004 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 879 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_refs 1908538.994451 # Average number of references to valid blocks.
system.cpu.icache.avg_refs 277405.340159 # Average number of references to valid blocks.
system.cpu.icache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 1719594535 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 13991.120977 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 12991.120977 # average overall mshr miss latency
system.cpu.icache.demand_hits 1719593634 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 12606000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.000001 # miss rate for demand accesses
system.cpu.icache.demand_misses 901 # number of demand (read+write) misses
system.cpu.icache.demand_accesses 243840173 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 13993.174061 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 12993.174061 # average overall mshr miss latency
system.cpu.icache.demand_hits 243839294 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 12300000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.000004 # miss rate for demand accesses
system.cpu.icache.demand_misses 879 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 11705000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.000001 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 901 # number of demand (read+write) MSHR misses
system.cpu.icache.demand_mshr_miss_latency 11421000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.000004 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 879 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 1719594535 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 13991.120977 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 12991.120977 # average overall mshr miss latency
system.cpu.icache.overall_accesses 243840173 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 13993.174061 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 12993.174061 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 1719593634 # number of overall hits
system.cpu.icache.overall_miss_latency 12606000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.000001 # miss rate for overall accesses
system.cpu.icache.overall_misses 901 # number of overall misses
system.cpu.icache.overall_hits 243839294 # number of overall hits
system.cpu.icache.overall_miss_latency 12300000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.000004 # miss rate for overall accesses
system.cpu.icache.overall_misses 879 # number of overall misses
system.cpu.icache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 11705000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.000001 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 901 # number of overall MSHR misses
system.cpu.icache.overall_mshr_miss_latency 11421000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.000004 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 879 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.icache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.icache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
@ -145,64 +145,60 @@ system.cpu.icache.prefetcher.num_hwpf_issued 0
system.cpu.icache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.icache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.icache.replacements 31 # number of replacements
system.cpu.icache.sampled_refs 901 # Sample count of references to valid blocks.
system.cpu.icache.replacements 25 # number of replacements
system.cpu.icache.sampled_refs 879 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 737.715884 # Cycle average of tags in use
system.cpu.icache.total_refs 1719593634 # Total number of references to valid blocks.
system.cpu.icache.tagsinuse 716.200092 # Cycle average of tags in use
system.cpu.icache.total_refs 243839294 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.idle_fraction 0 # Percentage of idle cycles
system.cpu.l2cache.ReadReq_accesses 14775639 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 12999.785859 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 10999.785859 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_hits 8592784 # number of ReadReq hits
system.cpu.l2cache.ReadReq_miss_latency 80375791000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 0.418449 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 6182855 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 68010081000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate 0.418449 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 6182855 # number of ReadReq MSHR misses
system.cpu.l2cache.Writeback_accesses 4191356 # number of Writeback accesses(hits+misses)
system.cpu.l2cache.Writeback_hits 4164131 # number of Writeback hits
system.cpu.l2cache.Writeback_miss_rate 0.006496 # miss rate for Writeback accesses
system.cpu.l2cache.Writeback_misses 27225 # number of Writeback misses
system.cpu.l2cache.Writeback_mshr_miss_rate 0.006496 # mshr miss rate for Writeback accesses
system.cpu.l2cache.Writeback_mshr_misses 27225 # number of Writeback MSHR misses
system.cpu.l2cache.ReadReq_accesses 940381 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 13000 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 11000 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_hits 924777 # number of ReadReq hits
system.cpu.l2cache.ReadReq_miss_latency 202852000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 0.016593 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 15604 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 171644000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate 0.016593 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 15604 # number of ReadReq MSHR misses
system.cpu.l2cache.Writeback_accesses 94807 # number of Writeback accesses(hits+misses)
system.cpu.l2cache.Writeback_hits 94807 # number of Writeback hits
system.cpu.l2cache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_refs 2.063273 # Average number of references to valid blocks.
system.cpu.l2cache.avg_refs 65.341195 # Average number of references to valid blocks.
system.cpu.l2cache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 14775639 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 12999.785859 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 10999.785859 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 8592784 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 80375791000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 0.418449 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 6182855 # number of demand (read+write) misses
system.cpu.l2cache.demand_accesses 940381 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 13000 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 11000 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 924777 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 202852000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 0.016593 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 15604 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_miss_latency 68010081000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate 0.418449 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 6182855 # number of demand (read+write) MSHR misses
system.cpu.l2cache.demand_mshr_miss_latency 171644000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate 0.016593 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 15604 # number of demand (read+write) MSHR misses
system.cpu.l2cache.fast_writes 0 # number of fast writes performed
system.cpu.l2cache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 18966995 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 12942.794779 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 10999.785859 # average overall mshr miss latency
system.cpu.l2cache.overall_accesses 1035188 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 13000 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 11000 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_hits 12756915 # number of overall hits
system.cpu.l2cache.overall_miss_latency 80375791000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 0.327415 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 6210080 # number of overall misses
system.cpu.l2cache.overall_hits 1019584 # number of overall hits
system.cpu.l2cache.overall_miss_latency 202852000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 0.015074 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 15604 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_miss_latency 68010081000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate 0.325980 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 6182855 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_miss_latency 171644000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate 0.015074 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 15604 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.l2cache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
system.cpu.l2cache.prefetcher.num_hwpf_already_in_cache 0 # number of hwpf that were already in the cache
@ -214,17 +210,17 @@ system.cpu.l2cache.prefetcher.num_hwpf_issued 0
system.cpu.l2cache.prefetcher.num_hwpf_removed_MSHR_hit 0 # number of hwpf removed because MSHR allocated
system.cpu.l2cache.prefetcher.num_hwpf_span_page 0 # number of hwpf spanning a virtual page
system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0 # number of hwpf that got squashed due to a miss aborting calculation time
system.cpu.l2cache.replacements 6150087 # number of replacements
system.cpu.l2cache.sampled_refs 6182855 # Sample count of references to valid blocks.
system.cpu.l2cache.replacements 0 # number of replacements
system.cpu.l2cache.sampled_refs 15604 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 26129.060966 # Cycle average of tags in use
system.cpu.l2cache.total_refs 12756915 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 806915893000 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 1069081 # number of writebacks
system.cpu.l2cache.tagsinuse 10833.027960 # Cycle average of tags in use
system.cpu.l2cache.total_refs 1019584 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 0 # number of writebacks
system.cpu.not_idle_fraction 1 # Percentage of non-idle cycles
system.cpu.numCycles 2669284585000 # number of cpu cycles simulated
system.cpu.num_insts 1719594534 # Number of instructions executed
system.cpu.num_refs 774793634 # Number of memory references
system.cpu.workload.PROG:num_syscalls 632 # Number of system calls
system.cpu.numCycles 359340764000 # number of cpu cycles simulated
system.cpu.num_insts 243840172 # Number of instructions executed
system.cpu.num_refs 105125191 # Number of memory references
system.cpu.workload.PROG:num_syscalls 428 # Number of system calls
---------- End Simulation Statistics ----------

File diff suppressed because it is too large Load diff

View file

@ -4,19 +4,15 @@ by Andreas Loebel
Copyright (c) 1998,1999 ZIB Berlin
All Rights Reserved.
nodes : 1800
active arcs : 8190
simplex iterations : 6837
flow value : 12860044181
new implicit arcs : 300000
active arcs : 308190
simplex iterations : 11843
flow value : 9360043604
new implicit arcs : 22787
active arcs : 330977
simplex iterations : 11931
flow value : 9360043512
checksum : 798014
nodes : 500
active arcs : 1905
simplex iterations : 1502
flow value : 4990014995
new implicit arcs : 23867
active arcs : 25772
simplex iterations : 2663
flow value : 3080014995
checksum : 68389
optimal
M5 Simulator System
@ -25,9 +21,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled May 15 2007 13:02:31
M5 started Tue May 15 15:05:32 2007
M5 compiled Jun 21 2007 21:15:48
M5 started Fri Jun 22 02:01:52 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/SPARC_SE/m5.fast -d build/SPARC_SE/tests/fast/long/10.mcf/sparc/linux/simple-timing tests/run.py long/10.mcf/sparc/linux/simple-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 2669284585000 because target called exit()
Exiting @ tick 359340764000 because target called exit()

View file

@ -29,5 +29,5 @@
m5.AddToPath('../configs/common')
from cpu2000 import mcf
workload = mcf(isa, opsys, 'lgred')
workload = mcf(isa, opsys, 'smred')
root.system.cpu.workload = workload.makeLiveProcess()

View file

@ -29,5 +29,5 @@
m5.AddToPath('../configs/common')
from cpu2000 import parser
workload = parser(isa, opsys, 'lgred')
workload = parser(isa, opsys, 'mdred')
root.system.cpu.workload = workload.makeLiveProcess()

View file

@ -21,6 +21,7 @@ SQEntries=32
SSITSize=1024
activity=0
backComSize=5
cachePorts=200
choiceCtrBits=2
choicePredictorSize=8192
clock=500
@ -74,6 +75,15 @@ renameToFetchDelay=1
renameToIEWDelay=2
renameToROBDelay=1
renameWidth=8
smtCommitPolicy=RoundRobin
smtFetchPolicy=SingleThread
smtIQPolicy=Partitioned
smtIQThreshold=100
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtNumFetchingThreads=1
smtROBPolicy=Partitioned
smtROBThreshold=100
squashWidth=8
system=system
trapLatency=13
@ -86,6 +96,7 @@ icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -261,6 +272,7 @@ opLat=3
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -299,6 +311,7 @@ mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false

View file

@ -1,39 +1,40 @@
---------- Begin Simulation Statistics ----------
global.BPredUnit.BTBCorrect 0 # Number of correct BTB predictions (this stat may not work properly.
global.BPredUnit.BTBHits 524 # Number of BTB hits
global.BPredUnit.BTBLookups 1590 # Number of BTB lookups
global.BPredUnit.BTBHits 522 # Number of BTB hits
global.BPredUnit.BTBLookups 1584 # Number of BTB lookups
global.BPredUnit.RASInCorrect 57 # Number of incorrect RAS predictions.
global.BPredUnit.condIncorrect 422 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 1093 # Number of conditional branches predicted
global.BPredUnit.lookups 1843 # Number of BP lookups
global.BPredUnit.condPredicted 1088 # Number of conditional branches predicted
global.BPredUnit.lookups 1837 # Number of BP lookups
global.BPredUnit.usedRAS 241 # Number of times the RAS was used to get a target.
host_inst_rate 7145 # Simulator instruction rate (inst/s)
host_seconds 0.79 # Real time elapsed on the host
host_tick_rate 5828052 # Simulator tick rate (ticks/s)
host_inst_rate 39303 # Simulator instruction rate (inst/s)
host_mem_usage 153768 # Number of bytes of host memory used
host_seconds 0.14 # Real time elapsed on the host
host_tick_rate 32016268 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 17 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 127 # Number of conflicting stores.
memdepunit.memDep.insertedLoads 1876 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 1144 # Number of stores inserted to the mem dependence unit.
memdepunit.memDep.insertedLoads 1874 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 1142 # Number of stores inserted to the mem dependence unit.
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 5623 # Number of instructions simulated
sim_seconds 0.000005 # Number of seconds simulated
sim_ticks 4588000 # Number of ticks simulated
sim_ticks 4589500 # Number of ticks simulated
system.cpu.commit.COM:branches 862 # Number of branches committed
system.cpu.commit.COM:bw_lim_events 104 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_limited 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:committed_per_cycle.start_dist # Number of insts commited each cycle
system.cpu.commit.COM:committed_per_cycle.samples 8514
system.cpu.commit.COM:committed_per_cycle.samples 8521
system.cpu.commit.COM:committed_per_cycle.min_value 0
0 6195 7276.25%
1 1158 1360.11%
2 469 550.86%
3 176 206.72%
4 131 153.86%
5 99 116.28%
6 109 128.02%
7 73 85.74%
8 104 122.15%
0 6200 7276.14%
1 1160 1361.34%
2 469 550.40%
3 177 207.72%
4 131 153.74%
5 98 115.01%
6 109 127.92%
7 73 85.67%
8 104 122.05%
system.cpu.commit.COM:committed_per_cycle.max_value 8
system.cpu.commit.COM:committed_per_cycle.end_dist
@ -45,27 +46,27 @@ system.cpu.commit.COM:swp_count 0 # Nu
system.cpu.commit.branchMispredicts 350 # The number of times a branch was mispredicted
system.cpu.commit.commitCommittedInsts 5640 # The number of committed instructions
system.cpu.commit.commitNonSpecStalls 17 # The number of times commit has been forced to stall to communicate backwards
system.cpu.commit.commitSquashedInsts 3588 # The number of squashed insts skipped by commit
system.cpu.commit.commitSquashedInsts 3571 # The number of squashed insts skipped by commit
system.cpu.committedInsts 5623 # Number of Instructions Simulated
system.cpu.committedInsts_total 5623 # Number of Instructions Simulated
system.cpu.cpi 1.635604 # CPI: Cycles Per Instruction
system.cpu.cpi_total 1.635604 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 1475 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 5928.571429 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 5385 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 1342 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 788500 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.090169 # miss rate for ReadReq accesses
system.cpu.cpi 1.636315 # CPI: Cycles Per Instruction
system.cpu.cpi_total 1.636315 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 1470 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 5932.330827 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 5380 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 1337 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 789000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.090476 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 133 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 33 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 538500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.067797 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_miss_latency 538000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.068027 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 100 # number of ReadReq MSHR misses
system.cpu.dcache.WriteReq_accesses 812 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency 4501.457726 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_miss_latency 4504.373178 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency 5116.438356 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 469 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 1544000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_latency 1545000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.422414 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 343 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 270 # number of WriteReq MSHR hits
@ -74,37 +75,37 @@ system.cpu.dcache.WriteReq_mshr_miss_rate 0.089901 # m
system.cpu.dcache.WriteReq_mshr_misses 73 # number of WriteReq MSHR misses
system.cpu.dcache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_refs 10.468208 # Average number of references to valid blocks.
system.cpu.dcache.avg_refs 10.439306 # Average number of references to valid blocks.
system.cpu.dcache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 2287 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 4900.210084 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 5271.676301 # average overall mshr miss latency
system.cpu.dcache.demand_hits 1811 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 2332500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.208133 # miss rate for demand accesses
system.cpu.dcache.demand_accesses 2282 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 4903.361345 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 5268.786127 # average overall mshr miss latency
system.cpu.dcache.demand_hits 1806 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 2334000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.208589 # miss rate for demand accesses
system.cpu.dcache.demand_misses 476 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 303 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 912000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.075645 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_miss_latency 911500 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.075811 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 173 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 2287 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 4900.210084 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 5271.676301 # average overall mshr miss latency
system.cpu.dcache.overall_accesses 2282 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 4903.361345 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 5268.786127 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 1811 # number of overall hits
system.cpu.dcache.overall_miss_latency 2332500 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.208133 # miss rate for overall accesses
system.cpu.dcache.overall_hits 1806 # number of overall hits
system.cpu.dcache.overall_miss_latency 2334000 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.208589 # miss rate for overall accesses
system.cpu.dcache.overall_misses 476 # number of overall misses
system.cpu.dcache.overall_mshr_hits 303 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 912000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.075645 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_miss_latency 911500 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.075811 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 173 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.dcache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
@ -120,88 +121,88 @@ system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.dcache.replacements 0 # number of replacements
system.cpu.dcache.sampled_refs 173 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 112.670676 # Cycle average of tags in use
system.cpu.dcache.total_refs 1811 # Total number of references to valid blocks.
system.cpu.dcache.tagsinuse 112.669258 # Cycle average of tags in use
system.cpu.dcache.total_refs 1806 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 0 # number of writebacks
system.cpu.decode.DECODE:BlockedCycles 389 # Number of cycles decode is blocked
system.cpu.decode.DECODE:BranchMispred 75 # Number of times decode detected a branch misprediction
system.cpu.decode.DECODE:BranchResolved 144 # Number of times decode resolved a branch
system.cpu.decode.DECODE:DecodedInsts 10499 # Number of instructions handled by decode
system.cpu.decode.DECODE:BranchResolved 143 # Number of times decode resolved a branch
system.cpu.decode.DECODE:DecodedInsts 10466 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 6230 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 1848 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 682 # Number of cycles decode is squashing
system.cpu.decode.DECODE:RunCycles 1855 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 679 # Number of cycles decode is squashing
system.cpu.decode.DECODE:SquashedInsts 228 # Number of squashed instructions handled by decode
system.cpu.decode.DECODE:UnblockCycles 48 # Number of cycles decode is unblocking
system.cpu.fetch.Branches 1843 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 1471 # Number of cache lines fetched
system.cpu.fetch.Cycles 3451 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 269 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 11450 # Number of instructions fetch has processed
system.cpu.fetch.Branches 1837 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 1469 # Number of cache lines fetched
system.cpu.fetch.Cycles 3456 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 267 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 11417 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 455 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.200391 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 1471 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 765 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.244971 # Number of inst fetches per cycle
system.cpu.fetch.branchRate 0.199652 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 1469 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 763 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.240843 # Number of inst fetches per cycle
system.cpu.fetch.rateDist.start_dist # Number of instructions fetched each cycle (Total)
system.cpu.fetch.rateDist.samples 9197
system.cpu.fetch.rateDist.samples 9201
system.cpu.fetch.rateDist.min_value 0
0 7219 7849.30%
1 167 181.58%
2 147 159.83%
3 129 140.26%
4 200 217.46%
5 139 151.14%
6 181 196.80%
7 99 107.64%
8 916 995.98%
0 7216 7842.63%
1 168 182.59%
2 148 160.85%
3 136 147.81%
4 214 232.58%
5 138 149.98%
6 177 192.37%
7 95 103.25%
8 909 987.94%
system.cpu.fetch.rateDist.max_value 8
system.cpu.fetch.rateDist.end_dist
system.cpu.icache.ReadReq_accesses 1471 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5375.757576 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4524.038462 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 1141 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 1774000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.224337 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_accesses 1469 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5381.818182 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4530.448718 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 1139 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 1776000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.224643 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 330 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 18 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 1411500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.212101 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_miss_latency 1413500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.212389 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 312 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_refs 3.657051 # Average number of references to valid blocks.
system.cpu.icache.avg_refs 3.650641 # Average number of references to valid blocks.
system.cpu.icache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 1471 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5375.757576 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4524.038462 # average overall mshr miss latency
system.cpu.icache.demand_hits 1141 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 1774000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.224337 # miss rate for demand accesses
system.cpu.icache.demand_accesses 1469 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5381.818182 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4530.448718 # average overall mshr miss latency
system.cpu.icache.demand_hits 1139 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 1776000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.224643 # miss rate for demand accesses
system.cpu.icache.demand_misses 330 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 18 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 1411500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.212101 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_miss_latency 1413500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.212389 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 312 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 1471 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5375.757576 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4524.038462 # average overall mshr miss latency
system.cpu.icache.overall_accesses 1469 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5381.818182 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4530.448718 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 1141 # number of overall hits
system.cpu.icache.overall_miss_latency 1774000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.224337 # miss rate for overall accesses
system.cpu.icache.overall_hits 1139 # number of overall hits
system.cpu.icache.overall_miss_latency 1776000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.224643 # miss rate for overall accesses
system.cpu.icache.overall_misses 330 # number of overall misses
system.cpu.icache.overall_mshr_hits 18 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 1411500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.212101 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_miss_latency 1413500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.212389 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 312 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.icache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
@ -217,39 +218,39 @@ system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.icache.replacements 0 # number of replacements
system.cpu.icache.sampled_refs 312 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 165.938349 # Cycle average of tags in use
system.cpu.icache.total_refs 1141 # Total number of references to valid blocks.
system.cpu.icache.tagsinuse 165.921810 # Cycle average of tags in use
system.cpu.icache.total_refs 1139 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.idleCycles 2475 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 1148 # Number of branches executed
system.cpu.idleCycles 2474 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 1144 # Number of branches executed
system.cpu.iew.EXEC:nop 40 # number of nop insts executed
system.cpu.iew.EXEC:rate 0.837338 # Inst execution rate
system.cpu.iew.EXEC:refs 2524 # number of memory reference insts executed
system.cpu.iew.EXEC:rate 0.835018 # Inst execution rate
system.cpu.iew.EXEC:refs 2519 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 977 # Number of stores executed
system.cpu.iew.EXEC:swp 0 # number of swp insts executed
system.cpu.iew.WB:consumers 5205 # num instructions consuming a value
system.cpu.iew.WB:count 7402 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 0.742747 # average fanout of values written-back
system.cpu.iew.WB:consumers 5193 # num instructions consuming a value
system.cpu.iew.WB:count 7387 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 0.742923 # average fanout of values written-back
system.cpu.iew.WB:penalized 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_rate 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:producers 3866 # num instructions producing a value
system.cpu.iew.WB:rate 0.804828 # insts written-back per cycle
system.cpu.iew.WB:sent 7467 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 374 # Number of branch mispredicts detected at execute
system.cpu.iew.WB:producers 3858 # num instructions producing a value
system.cpu.iew.WB:rate 0.802848 # insts written-back per cycle
system.cpu.iew.WB:sent 7452 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 373 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 4 # Number of cycles IEW is blocking
system.cpu.iew.iewDispLoadInsts 1876 # Number of dispatched load instructions
system.cpu.iew.iewDispLoadInsts 1874 # Number of dispatched load instructions
system.cpu.iew.iewDispNonSpecInsts 22 # Number of dispatched non-speculative instructions
system.cpu.iew.iewDispSquashedInsts 315 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 1144 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 9245 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 1547 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 280 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 7701 # Number of executed instructions
system.cpu.iew.iewDispSquashedInsts 302 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 1142 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 9228 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 1542 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 285 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 7683 # Number of executed instructions
system.cpu.iew.iewIQFullEvents 0 # Number of times the IQ has become full, causing a stall
system.cpu.iew.iewIdleCycles 0 # Number of cycles IEW is idle
system.cpu.iew.iewLSQFullEvents 0 # Number of times the LSQ has become full, causing a stall
system.cpu.iew.iewSquashCycles 682 # Number of cycles IEW is squashing
system.cpu.iew.iewSquashCycles 679 # Number of cycles IEW is squashing
system.cpu.iew.iewUnblockCycles 0 # Number of cycles IEW is unblocking
system.cpu.iew.lsq.thread.0.blockedLoads 0 # Number of blocked loads due to partial load-store forwarding
system.cpu.iew.lsq.thread.0.cacheBlocked 0 # Number of times an access to memory failed due to the cache being blocked
@ -259,17 +260,17 @@ system.cpu.iew.lsq.thread.0.invAddrLoads 0 # Nu
system.cpu.iew.lsq.thread.0.invAddrSwpfs 0 # Number of software prefetches ignored due to an invalid address
system.cpu.iew.lsq.thread.0.memOrderViolation 63 # Number of memory ordering violations
system.cpu.iew.lsq.thread.0.rescheduledLoads 1 # Number of loads that were rescheduled
system.cpu.iew.lsq.thread.0.squashedLoads 897 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 332 # Number of stores squashed
system.cpu.iew.lsq.thread.0.squashedLoads 895 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 330 # Number of stores squashed
system.cpu.iew.memOrderViolationEvents 63 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 263 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedNotTakenIncorrect 262 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 111 # Number of branches that were predicted taken incorrectly
system.cpu.ipc 0.611395 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.611395 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 7981 # Type of FU issued
system.cpu.ipc 0.611129 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.611129 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 7968 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.start_dist
No_OpClass 2 0.03% # Type of FU issued
IntAlu 5322 66.68% # Type of FU issued
IntAlu 5314 66.69% # Type of FU issued
IntMult 1 0.01% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 2 0.03% # Type of FU issued
@ -278,13 +279,13 @@ system.cpu.iq.ISSUE:FU_type_0.start_dist
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 1662 20.82% # Type of FU issued
MemWrite 992 12.43% # Type of FU issued
MemRead 1659 20.82% # Type of FU issued
MemWrite 990 12.42% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.end_dist
system.cpu.iq.ISSUE:fu_busy_cnt 106 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.013282 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_cnt 105 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.013178 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_full.start_dist
No_OpClass 0 0.00% # attempts to use FU when none available
IntAlu 0 0.00% # attempts to use FU when none available
@ -296,41 +297,41 @@ system.cpu.iq.ISSUE:fu_full.start_dist
FloatMult 0 0.00% # attempts to use FU when none available
FloatDiv 0 0.00% # attempts to use FU when none available
FloatSqrt 0 0.00% # attempts to use FU when none available
MemRead 71 66.98% # attempts to use FU when none available
MemWrite 35 33.02% # attempts to use FU when none available
MemRead 70 66.67% # attempts to use FU when none available
MemWrite 35 33.33% # attempts to use FU when none available
IprAccess 0 0.00% # attempts to use FU when none available
InstPrefetch 0 0.00% # attempts to use FU when none available
system.cpu.iq.ISSUE:fu_full.end_dist
system.cpu.iq.ISSUE:issued_per_cycle.start_dist # Number of insts issued each cycle
system.cpu.iq.ISSUE:issued_per_cycle.samples 9197
system.cpu.iq.ISSUE:issued_per_cycle.samples 9201
system.cpu.iq.ISSUE:issued_per_cycle.min_value 0
0 5952 6471.68%
1 1107 1203.65%
2 919 999.24%
3 442 480.59%
4 375 407.74%
5 250 271.83%
6 115 125.04%
7 26 28.27%
8 11 11.96%
0 5952 6468.86%
1 1111 1207.48%
2 928 1008.59%
3 433 470.60%
4 378 410.82%
5 251 272.80%
6 111 120.64%
7 27 29.34%
8 10 10.87%
system.cpu.iq.ISSUE:issued_per_cycle.max_value 8
system.cpu.iq.ISSUE:issued_per_cycle.end_dist
system.cpu.iq.ISSUE:rate 0.867783 # Inst issue rate
system.cpu.iq.iqInstsAdded 9183 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 7981 # Number of instructions issued
system.cpu.iq.ISSUE:rate 0.865993 # Inst issue rate
system.cpu.iq.iqInstsAdded 9166 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 7968 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 22 # Number of non-speculative instructions added to the IQ
system.cpu.iq.iqSquashedInstsExamined 3171 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsExamined 3154 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 22 # Number of squashed instructions issued
system.cpu.iq.iqSquashedNonSpecRemoved 5 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 2045 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.iq.iqSquashedOperandsExamined 2035 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 483 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 4639.751553 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2463.768116 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_miss_latency 2241000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_avg_miss_latency 4644.927536 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2467.908903 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_miss_latency 2243500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 1 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 483 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 1190000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_latency 1192000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate 1 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 483 # number of ReadReq MSHR misses
system.cpu.l2cache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
@ -342,29 +343,29 @@ system.cpu.l2cache.blocked_cycles_no_mshrs 0 #
system.cpu.l2cache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 483 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 4639.751553 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2463.768116 # average overall mshr miss latency
system.cpu.l2cache.demand_avg_miss_latency 4644.927536 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2467.908903 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 0 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 2241000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency 2243500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 1 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 483 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_miss_latency 1190000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency 1192000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate 1 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 483 # number of demand (read+write) MSHR misses
system.cpu.l2cache.fast_writes 0 # number of fast writes performed
system.cpu.l2cache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 483 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 4639.751553 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2463.768116 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_miss_latency 4644.927536 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2467.908903 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_hits 0 # number of overall hits
system.cpu.l2cache.overall_miss_latency 2241000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency 2243500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 1 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 483 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_miss_latency 1190000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency 1192000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate 1 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 483 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
@ -381,27 +382,27 @@ system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.l2cache.replacements 0 # number of replacements
system.cpu.l2cache.sampled_refs 483 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 278.222582 # Cycle average of tags in use
system.cpu.l2cache.tagsinuse 278.204751 # Cycle average of tags in use
system.cpu.l2cache.total_refs 0 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 0 # number of writebacks
system.cpu.numCycles 9197 # number of cpu cycles simulated
system.cpu.numCycles 9201 # number of cpu cycles simulated
system.cpu.rename.RENAME:BlockCycles 15 # Number of cycles rename is blocking
system.cpu.rename.RENAME:CommittedMaps 4051 # Number of HB maps that are committed
system.cpu.rename.RENAME:IdleCycles 6383 # Number of cycles rename is idle
system.cpu.rename.RENAME:IdleCycles 6382 # Number of cycles rename is idle
system.cpu.rename.RENAME:LSQFullEvents 70 # Number of times rename has blocked due to LSQ full
system.cpu.rename.RENAME:RenameLookups 12854 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 10031 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 7485 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 1746 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 682 # Number of cycles rename is squashing
system.cpu.rename.RENAME:RenameLookups 12837 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 10018 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 7477 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 1754 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 679 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 101 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 3434 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:UndoneMaps 3426 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 270 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:serializingInsts 26 # count of serializing insts renamed
system.cpu.rename.RENAME:skidInsts 380 # count of insts added to the skid buffer
system.cpu.rename.RENAME:tempSerializingInsts 20 # count of temporary serializing insts renamed
system.cpu.timesIdled 25 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.timesIdled 26 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.workload.PROG:num_syscalls 17 # Number of system calls
---------- End Simulation Statistics ----------

View file

@ -6,9 +6,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled Jun 10 2007 14:06:20
M5 started Sun Jun 10 14:22:32 2007
M5 executing on iceaxe
command line: /Users/nate/build/outgoing/build/ALPHA_SE/m5.debug -d /Users/nate/build/outgoing/build/ALPHA_SE/tests/debug/quick/00.hello/alpha/linux/o3-timing tests/run.py quick/00.hello/alpha/linux/o3-timing
M5 compiled Jun 21 2007 21:25:27
M5 started Fri Jun 22 00:04:38 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/ALPHA_SE/m5.fast -d build/ALPHA_SE/tests/fast/quick/00.hello/alpha/linux/o3-timing tests/run.py quick/00.hello/alpha/linux/o3-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 4588000 because target called exit()
Exiting @ tick 4589500 because target called exit()

View file

@ -21,6 +21,7 @@ SQEntries=32
SSITSize=1024
activity=0
backComSize=5
cachePorts=200
choiceCtrBits=2
choicePredictorSize=8192
clock=500
@ -74,6 +75,15 @@ renameToFetchDelay=1
renameToIEWDelay=2
renameToROBDelay=1
renameWidth=8
smtCommitPolicy=RoundRobin
smtFetchPolicy=SingleThread
smtIQPolicy=Partitioned
smtIQThreshold=100
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtNumFetchingThreads=1
smtROBPolicy=Partitioned
smtROBThreshold=100
squashWidth=8
system=system
trapLatency=13
@ -86,6 +96,7 @@ icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -261,6 +272,7 @@ opLat=3
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -299,6 +311,7 @@ mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false

View file

@ -8,9 +8,10 @@ global.BPredUnit.condIncorrect 208 # Nu
global.BPredUnit.condPredicted 376 # Number of conditional branches predicted
global.BPredUnit.lookups 738 # Number of BP lookups
global.BPredUnit.usedRAS 140 # Number of times the RAS was used to get a target.
host_inst_rate 8881 # Simulator instruction rate (inst/s)
host_seconds 0.27 # Real time elapsed on the host
host_tick_rate 7632084 # Simulator tick rate (ticks/s)
host_inst_rate 39805 # Simulator instruction rate (inst/s)
host_mem_usage 153128 # Number of bytes of host memory used
host_seconds 0.06 # Real time elapsed on the host
host_tick_rate 34110715 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 8 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 7 # Number of conflicting stores.
memdepunit.memDep.insertedLoads 608 # Number of loads inserted to the mem dependence unit.
@ -18,22 +19,22 @@ memdepunit.memDep.insertedStores 357 # Nu
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 2387 # Number of instructions simulated
sim_seconds 0.000002 # Number of seconds simulated
sim_ticks 2053000 # Number of ticks simulated
sim_ticks 2055000 # Number of ticks simulated
system.cpu.commit.COM:branches 396 # Number of branches committed
system.cpu.commit.COM:bw_lim_events 41 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_limited 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:committed_per_cycle.start_dist # Number of insts commited each cycle
system.cpu.commit.COM:committed_per_cycle.samples 3906
system.cpu.commit.COM:committed_per_cycle.samples 3910
system.cpu.commit.COM:committed_per_cycle.min_value 0
0 2949 7549.92%
1 266 681.00%
2 333 852.53%
3 131 335.38%
4 74 189.45%
5 64 163.85%
6 29 74.24%
7 19 48.64%
8 41 104.97%
0 2950 7544.76%
1 266 680.31%
2 336 859.34%
3 131 335.04%
4 76 194.37%
5 65 166.24%
6 27 69.05%
7 18 46.04%
8 41 104.86%
system.cpu.commit.COM:committed_per_cycle.max_value 8
system.cpu.commit.COM:committed_per_cycle.end_dist
@ -48,17 +49,17 @@ system.cpu.commit.commitNonSpecStalls 4 # Th
system.cpu.commit.commitSquashedInsts 978 # The number of squashed insts skipped by commit
system.cpu.committedInsts 2387 # Number of Instructions Simulated
system.cpu.committedInsts_total 2387 # Number of Instructions Simulated
system.cpu.cpi 1.721408 # CPI: Cycles Per Instruction
system.cpu.cpi_total 1.721408 # CPI: Total CPI of All Threads
system.cpu.cpi 1.723083 # CPI: Cycles Per Instruction
system.cpu.cpi_total 1.723083 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 514 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 5456.521739 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 4737.288136 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_avg_miss_latency 5391.304348 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 4669.491525 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 445 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 376500 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_latency 372000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.134241 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 69 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 10 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 279500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_latency 275500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.114786 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 59 # number of ReadReq MSHR misses
system.cpu.dcache.WriteReq_accesses 294 # number of WriteReq accesses(hits+misses)
@ -81,29 +82,29 @@ system.cpu.dcache.blocked_cycles_no_mshrs 0 # n
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 808 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 5564.285714 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 4821.428571 # average overall mshr miss latency
system.cpu.dcache.demand_avg_miss_latency 5532.142857 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 4773.809524 # average overall mshr miss latency
system.cpu.dcache.demand_hits 668 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 779000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_latency 774500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.173267 # miss rate for demand accesses
system.cpu.dcache.demand_misses 140 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 56 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 405000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_latency 401000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.103960 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 84 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 808 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 5564.285714 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 4821.428571 # average overall mshr miss latency
system.cpu.dcache.overall_avg_miss_latency 5532.142857 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 4773.809524 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 668 # number of overall hits
system.cpu.dcache.overall_miss_latency 779000 # number of overall miss cycles
system.cpu.dcache.overall_miss_latency 774500 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.173267 # miss rate for overall accesses
system.cpu.dcache.overall_misses 140 # number of overall misses
system.cpu.dcache.overall_mshr_hits 56 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 405000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_latency 401000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.103960 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 84 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
@ -120,7 +121,7 @@ system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.dcache.replacements 0 # number of replacements
system.cpu.dcache.sampled_refs 84 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 51.851940 # Cycle average of tags in use
system.cpu.dcache.tagsinuse 51.873008 # Cycle average of tags in use
system.cpu.dcache.total_refs 668 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 0 # number of writebacks
@ -129,43 +130,43 @@ system.cpu.decode.DECODE:BranchMispred 81 # Nu
system.cpu.decode.DECODE:BranchResolved 123 # Number of times decode resolved a branch
system.cpu.decode.DECODE:DecodedInsts 4033 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 3045 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 767 # Number of cycles decode is running
system.cpu.decode.DECODE:RunCycles 771 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 202 # Number of cycles decode is squashing
system.cpu.decode.DECODE:SquashedInsts 298 # Number of squashed instructions handled by decode
system.cpu.fetch.Branches 738 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 654 # Number of cache lines fetched
system.cpu.fetch.Cycles 1440 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.Cycles 1444 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 120 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 4685 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 218 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.179606 # Number of branch fetches per cycle
system.cpu.fetch.branchRate 0.179431 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 654 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 272 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.140180 # Number of inst fetches per cycle
system.cpu.fetch.rate 1.139071 # Number of inst fetches per cycle
system.cpu.fetch.rateDist.start_dist # Number of instructions fetched each cycle (Total)
system.cpu.fetch.rateDist.samples 4109
system.cpu.fetch.rateDist.samples 4113
system.cpu.fetch.rateDist.min_value 0
0 3325 8091.99%
1 32 77.88%
2 74 180.09%
3 53 128.99%
4 99 240.93%
5 49 119.25%
6 38 92.48%
7 35 85.18%
8 404 983.21%
0 3325 8084.12%
1 32 77.80%
2 80 194.51%
3 50 121.57%
4 99 240.70%
5 52 126.43%
6 39 94.82%
7 35 85.10%
8 401 974.96%
system.cpu.fetch.rateDist.max_value 8
system.cpu.fetch.rateDist.end_dist
system.cpu.icache.ReadReq_accesses 654 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5296.019900 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4553.763441 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_avg_miss_latency 5298.507463 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4556.451613 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 453 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 1064500 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_latency 1065000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.307339 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 201 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 15 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 847000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_latency 847500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.284404 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 186 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
@ -177,29 +178,29 @@ system.cpu.icache.blocked_cycles_no_mshrs 0 # n
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 654 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5296.019900 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4553.763441 # average overall mshr miss latency
system.cpu.icache.demand_avg_miss_latency 5298.507463 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4556.451613 # average overall mshr miss latency
system.cpu.icache.demand_hits 453 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 1064500 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_latency 1065000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.307339 # miss rate for demand accesses
system.cpu.icache.demand_misses 201 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 15 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 847000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_latency 847500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.284404 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 186 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 654 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5296.019900 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4553.763441 # average overall mshr miss latency
system.cpu.icache.overall_avg_miss_latency 5298.507463 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4556.451613 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 453 # number of overall hits
system.cpu.icache.overall_miss_latency 1064500 # number of overall miss cycles
system.cpu.icache.overall_miss_latency 1065000 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.307339 # miss rate for overall accesses
system.cpu.icache.overall_misses 201 # number of overall misses
system.cpu.icache.overall_mshr_hits 15 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 847000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_latency 847500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.284404 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 186 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
@ -216,14 +217,14 @@ system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.icache.replacements 0 # number of replacements
system.cpu.icache.sampled_refs 186 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 106.237740 # Cycle average of tags in use
system.cpu.icache.tagsinuse 106.293956 # Cycle average of tags in use
system.cpu.icache.total_refs 453 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.idleCycles 2992 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 501 # Number of branches executed
system.cpu.iew.EXEC:nop 234 # number of nop insts executed
system.cpu.iew.EXEC:rate 0.727184 # Inst execution rate
system.cpu.iew.EXEC:rate 0.726477 # Inst execution rate
system.cpu.iew.EXEC:refs 878 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 333 # Number of stores executed
system.cpu.iew.EXEC:swp 0 # number of swp insts executed
@ -233,7 +234,7 @@ system.cpu.iew.WB:fanout 0.799637 # av
system.cpu.iew.WB:penalized 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_rate 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:producers 1321 # num instructions producing a value
system.cpu.iew.WB:rate 0.709175 # insts written-back per cycle
system.cpu.iew.WB:rate 0.708485 # insts written-back per cycle
system.cpu.iew.WB:sent 2931 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 135 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 0 # Number of cycles IEW is blocking
@ -263,8 +264,8 @@ system.cpu.iew.lsq.thread.0.squashedStores 63 #
system.cpu.iew.memOrderViolationEvents 10 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 98 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 37 # Number of branches that were predicted taken incorrectly
system.cpu.ipc 0.580920 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.580920 # IPC: Total IPC of All Threads
system.cpu.ipc 0.580355 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.580355 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 3075 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.start_dist
No_OpClass 0 0.00% # Type of FU issued
@ -301,21 +302,21 @@ system.cpu.iq.ISSUE:fu_full.start_dist
InstPrefetch 0 0.00% # attempts to use FU when none available
system.cpu.iq.ISSUE:fu_full.end_dist
system.cpu.iq.ISSUE:issued_per_cycle.start_dist # Number of insts issued each cycle
system.cpu.iq.ISSUE:issued_per_cycle.samples 4109
system.cpu.iq.ISSUE:issued_per_cycle.samples 4113
system.cpu.iq.ISSUE:issued_per_cycle.min_value 0
0 2849 6933.56%
1 475 1156.00%
2 270 657.09%
3 217 528.11%
4 159 386.96%
5 86 209.30%
6 34 82.75%
7 13 31.64%
8 6 14.60%
0 2848 6924.39%
1 479 1164.60%
2 276 671.04%
3 213 517.87%
4 158 384.15%
5 86 209.09%
6 34 82.66%
7 13 31.61%
8 6 14.59%
system.cpu.iq.ISSUE:issued_per_cycle.max_value 8
system.cpu.iq.ISSUE:issued_per_cycle.end_dist
system.cpu.iq.ISSUE:rate 0.748357 # Inst issue rate
system.cpu.iq.ISSUE:rate 0.747629 # Inst issue rate
system.cpu.iq.iqInstsAdded 3330 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 3075 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 7 # Number of non-speculative instructions added to the IQ
@ -323,9 +324,9 @@ system.cpu.iq.iqSquashedInstsExamined 790 # Nu
system.cpu.iq.iqSquashedNonSpecRemoved 3 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 409 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 270 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 4522.222222 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_miss_latency 4509.259259 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2388.888889 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_miss_latency 1221000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_latency 1217500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 1 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 270 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 645000 # number of ReadReq MSHR miss cycles
@ -340,10 +341,10 @@ system.cpu.l2cache.blocked_cycles_no_mshrs 0 #
system.cpu.l2cache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 270 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 4522.222222 # average overall miss latency
system.cpu.l2cache.demand_avg_miss_latency 4509.259259 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2388.888889 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 0 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 1221000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency 1217500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 1 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 270 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
@ -354,11 +355,11 @@ system.cpu.l2cache.fast_writes 0 # nu
system.cpu.l2cache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 270 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 4522.222222 # average overall miss latency
system.cpu.l2cache.overall_avg_miss_latency 4509.259259 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2388.888889 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_hits 0 # number of overall hits
system.cpu.l2cache.overall_miss_latency 1221000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency 1217500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 1 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 270 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
@ -379,18 +380,18 @@ system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.l2cache.replacements 0 # number of replacements
system.cpu.l2cache.sampled_refs 270 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 158.236294 # Cycle average of tags in use
system.cpu.l2cache.tagsinuse 158.313436 # Cycle average of tags in use
system.cpu.l2cache.total_refs 0 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 0 # number of writebacks
system.cpu.numCycles 4109 # number of cpu cycles simulated
system.cpu.numCycles 4113 # number of cpu cycles simulated
system.cpu.rename.RENAME:CommittedMaps 1768 # Number of HB maps that are committed
system.cpu.rename.RENAME:IdleCycles 3116 # Number of cycles rename is idle
system.cpu.rename.RENAME:LSQFullEvents 1 # Number of times rename has blocked due to LSQ full
system.cpu.rename.RENAME:RenameLookups 4416 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 3886 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 2777 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 696 # Number of cycles rename is running
system.cpu.rename.RENAME:RunCycles 700 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 202 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 6 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 1009 # Number of HB maps that are undone due to squashing

View file

@ -6,9 +6,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled Jun 10 2007 14:06:20
M5 started Sun Jun 10 14:22:36 2007
M5 executing on iceaxe
command line: /Users/nate/build/outgoing/build/ALPHA_SE/m5.debug -d /Users/nate/build/outgoing/build/ALPHA_SE/tests/debug/quick/00.hello/alpha/tru64/o3-timing tests/run.py quick/00.hello/alpha/tru64/o3-timing
M5 compiled Jun 21 2007 21:25:27
M5 started Fri Jun 22 00:04:44 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/ALPHA_SE/m5.fast -d build/ALPHA_SE/tests/fast/quick/00.hello/alpha/tru64/o3-timing tests/run.py quick/00.hello/alpha/tru64/o3-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 2053000 because target called exit()
Exiting @ tick 2055000 because target called exit()

View file

@ -21,6 +21,7 @@ SQEntries=32
SSITSize=1024
activity=0
backComSize=5
cachePorts=200
choiceCtrBits=2
choicePredictorSize=8192
clock=500
@ -74,6 +75,15 @@ renameToFetchDelay=1
renameToIEWDelay=2
renameToROBDelay=1
renameWidth=8
smtCommitPolicy=RoundRobin
smtFetchPolicy=SingleThread
smtIQPolicy=Partitioned
smtIQThreshold=100
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtNumFetchingThreads=1
smtROBPolicy=Partitioned
smtROBThreshold=100
squashWidth=8
system=system
trapLatency=13
@ -86,6 +96,7 @@ icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -261,6 +272,7 @@ opLat=3
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -299,6 +311,7 @@ mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false

View file

@ -1,47 +1,48 @@
---------- Begin Simulation Statistics ----------
global.BPredUnit.BTBCorrect 0 # Number of correct BTB predictions (this stat may not work properly.
global.BPredUnit.BTBHits 674 # Number of BTB hits
global.BPredUnit.BTBLookups 3410 # Number of BTB lookups
global.BPredUnit.RASInCorrect 118 # Number of incorrect RAS predictions.
global.BPredUnit.condIncorrect 1115 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 2318 # Number of conditional branches predicted
global.BPredUnit.lookups 3964 # Number of BP lookups
global.BPredUnit.usedRAS 532 # Number of times the RAS was used to get a target.
host_inst_rate 8215 # Simulator instruction rate (inst/s)
host_seconds 1.37 # Real time elapsed on the host
host_tick_rate 4009351 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 19 # Number of conflicting loads.
memdepunit.memDep.conflictingLoads 18 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 54 # Number of conflicting stores.
global.BPredUnit.BTBHits 696 # Number of BTB hits
global.BPredUnit.BTBLookups 3414 # Number of BTB lookups
global.BPredUnit.RASInCorrect 125 # Number of incorrect RAS predictions.
global.BPredUnit.condIncorrect 1124 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 2315 # Number of conditional branches predicted
global.BPredUnit.lookups 3940 # Number of BP lookups
global.BPredUnit.usedRAS 525 # Number of times the RAS was used to get a target.
host_inst_rate 52706 # Simulator instruction rate (inst/s)
host_mem_usage 154396 # Number of bytes of host memory used
host_seconds 0.21 # Real time elapsed on the host
host_tick_rate 25698682 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 16 # Number of conflicting loads.
memdepunit.memDep.conflictingLoads 16 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 53 # Number of conflicting stores.
memdepunit.memDep.conflictingStores 59 # Number of conflicting stores.
memdepunit.memDep.insertedLoads 1925 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedLoads 1898 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 1088 # Number of stores inserted to the mem dependence unit.
memdepunit.memDep.insertedLoads 1934 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedLoads 1903 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 1082 # Number of stores inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 1090 # Number of stores inserted to the mem dependence unit.
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 11247 # Number of instructions simulated
sim_seconds 0.000005 # Number of seconds simulated
sim_ticks 5490000 # Number of ticks simulated
sim_ticks 5491500 # Number of ticks simulated
system.cpu.commit.COM:branches 1724 # Number of branches committed
system.cpu.commit.COM:branches_0 862 # Number of branches committed
system.cpu.commit.COM:branches_1 862 # Number of branches committed
system.cpu.commit.COM:bw_lim_events 165 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_lim_events 168 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_limited 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:bw_limited_0 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:bw_limited_1 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:committed_per_cycle.start_dist # Number of insts commited each cycle
system.cpu.commit.COM:committed_per_cycle.samples 10929
system.cpu.commit.COM:committed_per_cycle.samples 10926
system.cpu.commit.COM:committed_per_cycle.min_value 0
0 6410 5865.13%
1 2019 1847.38%
2 999 914.08%
3 454 415.41%
4 300 274.50%
5 246 225.09%
6 200 183.00%
7 136 124.44%
8 165 150.97%
0 6353 5814.57%
1 2078 1901.89%
2 996 911.59%
3 472 432.00%
4 296 270.91%
5 241 220.57%
6 192 175.73%
7 130 118.98%
8 168 153.76%
system.cpu.commit.COM:committed_per_cycle.max_value 8
system.cpu.commit.COM:committed_per_cycle.end_dist
@ -60,133 +61,133 @@ system.cpu.commit.COM:refs_1 1791 # Nu
system.cpu.commit.COM:swp_count 0 # Number of s/w prefetches committed
system.cpu.commit.COM:swp_count_0 0 # Number of s/w prefetches committed
system.cpu.commit.COM:swp_count_1 0 # Number of s/w prefetches committed
system.cpu.commit.branchMispredicts 874 # The number of times a branch was mispredicted
system.cpu.commit.branchMispredicts 885 # The number of times a branch was mispredicted
system.cpu.commit.commitCommittedInsts 11281 # The number of committed instructions
system.cpu.commit.commitNonSpecStalls 34 # The number of times commit has been forced to stall to communicate backwards
system.cpu.commit.commitSquashedInsts 7769 # The number of squashed insts skipped by commit
system.cpu.commit.commitSquashedInsts 7777 # The number of squashed insts skipped by commit
system.cpu.committedInsts_0 5623 # Number of Instructions Simulated
system.cpu.committedInsts_1 5624 # Number of Instructions Simulated
system.cpu.committedInsts_total 11247 # Number of Instructions Simulated
system.cpu.cpi_0 1.952516 # CPI: Cycles Per Instruction
system.cpu.cpi_1 1.952169 # CPI: Cycles Per Instruction
system.cpu.cpi_total 0.976171 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 2969 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_accesses_0 2969 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency_0 7072.992701 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency_0 6972.361809 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 2695 # number of ReadReq hits
system.cpu.dcache.ReadReq_hits_0 2695 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 1938000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_latency_0 1938000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate_0 0.092287 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 274 # number of ReadReq misses
system.cpu.dcache.ReadReq_misses_0 274 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 75 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_hits_0 75 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 1387500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_latency_0 1387500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate_0 0.067026 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 199 # number of ReadReq MSHR misses
system.cpu.dcache.ReadReq_mshr_misses_0 199 # number of ReadReq MSHR misses
system.cpu.cpi_0 1.952872 # CPI: Cycles Per Instruction
system.cpu.cpi_1 1.952525 # CPI: Cycles Per Instruction
system.cpu.cpi_total 0.976349 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 2981 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_accesses_0 2981 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency_0 7040.892193 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency_0 6979.591837 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 2712 # number of ReadReq hits
system.cpu.dcache.ReadReq_hits_0 2712 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 1894000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_latency_0 1894000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate_0 0.090238 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 269 # number of ReadReq misses
system.cpu.dcache.ReadReq_misses_0 269 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 73 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_hits_0 73 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 1368000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_latency_0 1368000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate_0 0.065750 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 196 # number of ReadReq MSHR misses
system.cpu.dcache.ReadReq_mshr_misses_0 196 # number of ReadReq MSHR misses
system.cpu.dcache.WriteReq_accesses 1624 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_accesses_0 1624 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency_0 5352.409639 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency_0 5859.589041 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 1126 # number of WriteReq hits
system.cpu.dcache.WriteReq_hits_0 1126 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 2665500 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_latency_0 2665500 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate_0 0.306650 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 498 # number of WriteReq misses
system.cpu.dcache.WriteReq_misses_0 498 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 352 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_hits_0 352 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_miss_latency 855500 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_latency_0 855500 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_avg_miss_latency_0 5306.613226 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency_0 5852.739726 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 1125 # number of WriteReq hits
system.cpu.dcache.WriteReq_hits_0 1125 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 2648000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_latency_0 2648000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate_0 0.307266 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 499 # number of WriteReq misses
system.cpu.dcache.WriteReq_misses_0 499 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 353 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_hits_0 353 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_miss_latency 854500 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_latency_0 854500 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_rate_0 0.089901 # mshr miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_mshr_misses 146 # number of WriteReq MSHR misses
system.cpu.dcache.WriteReq_mshr_misses_0 146 # number of WriteReq MSHR misses
system.cpu.dcache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_refs 11.075362 # Average number of references to valid blocks.
system.cpu.dcache.avg_refs 11.219298 # Average number of references to valid blocks.
system.cpu.dcache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 4593 # number of demand (read+write) accesses
system.cpu.dcache.demand_accesses_0 4593 # number of demand (read+write) accesses
system.cpu.dcache.demand_accesses 4605 # number of demand (read+write) accesses
system.cpu.dcache.demand_accesses_0 4605 # number of demand (read+write) accesses
system.cpu.dcache.demand_accesses_1 0 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.dcache.demand_avg_miss_latency_0 5963.082902 # average overall miss latency
system.cpu.dcache.demand_avg_miss_latency_0 5914.062500 # average overall miss latency
system.cpu.dcache.demand_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency_0 6501.449275 # average overall mshr miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency_0 6498.538012 # average overall mshr miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.dcache.demand_hits 3821 # number of demand (read+write) hits
system.cpu.dcache.demand_hits_0 3821 # number of demand (read+write) hits
system.cpu.dcache.demand_hits 3837 # number of demand (read+write) hits
system.cpu.dcache.demand_hits_0 3837 # number of demand (read+write) hits
system.cpu.dcache.demand_hits_1 0 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 4603500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_latency_0 4603500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_latency 4542000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_latency_0 4542000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_latency_1 0 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate <err: div-0> # miss rate for demand accesses
system.cpu.dcache.demand_miss_rate_0 0.168082 # miss rate for demand accesses
system.cpu.dcache.demand_miss_rate_0 0.166775 # miss rate for demand accesses
system.cpu.dcache.demand_miss_rate_1 <err: div-0> # miss rate for demand accesses
system.cpu.dcache.demand_misses 772 # number of demand (read+write) misses
system.cpu.dcache.demand_misses_0 772 # number of demand (read+write) misses
system.cpu.dcache.demand_misses 768 # number of demand (read+write) misses
system.cpu.dcache.demand_misses_0 768 # number of demand (read+write) misses
system.cpu.dcache.demand_misses_1 0 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 427 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_hits_0 427 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_hits 426 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_hits_0 426 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_hits_1 0 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 2243000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_latency_0 2243000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_latency 2222500 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_latency_0 2222500 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_latency_1 0 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate <err: div-0> # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_miss_rate_0 0.075114 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_miss_rate_0 0.074267 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_miss_rate_1 <err: div-0> # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 345 # number of demand (read+write) MSHR misses
system.cpu.dcache.demand_mshr_misses_0 345 # number of demand (read+write) MSHR misses
system.cpu.dcache.demand_mshr_misses 342 # number of demand (read+write) MSHR misses
system.cpu.dcache.demand_mshr_misses_0 342 # number of demand (read+write) MSHR misses
system.cpu.dcache.demand_mshr_misses_1 0 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.mshr_cap_events_0 0 # number of times MSHR cap was activated
system.cpu.dcache.mshr_cap_events_1 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 4593 # number of overall (read+write) accesses
system.cpu.dcache.overall_accesses_0 4593 # number of overall (read+write) accesses
system.cpu.dcache.overall_accesses 4605 # number of overall (read+write) accesses
system.cpu.dcache.overall_accesses_0 4605 # number of overall (read+write) accesses
system.cpu.dcache.overall_accesses_1 0 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.dcache.overall_avg_miss_latency_0 5963.082902 # average overall miss latency
system.cpu.dcache.overall_avg_miss_latency_0 5914.062500 # average overall miss latency
system.cpu.dcache.overall_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency_0 6501.449275 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency_0 6498.538012 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency_0 <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency_1 <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 3821 # number of overall hits
system.cpu.dcache.overall_hits_0 3821 # number of overall hits
system.cpu.dcache.overall_hits 3837 # number of overall hits
system.cpu.dcache.overall_hits_0 3837 # number of overall hits
system.cpu.dcache.overall_hits_1 0 # number of overall hits
system.cpu.dcache.overall_miss_latency 4603500 # number of overall miss cycles
system.cpu.dcache.overall_miss_latency_0 4603500 # number of overall miss cycles
system.cpu.dcache.overall_miss_latency 4542000 # number of overall miss cycles
system.cpu.dcache.overall_miss_latency_0 4542000 # number of overall miss cycles
system.cpu.dcache.overall_miss_latency_1 0 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate <err: div-0> # miss rate for overall accesses
system.cpu.dcache.overall_miss_rate_0 0.168082 # miss rate for overall accesses
system.cpu.dcache.overall_miss_rate_0 0.166775 # miss rate for overall accesses
system.cpu.dcache.overall_miss_rate_1 <err: div-0> # miss rate for overall accesses
system.cpu.dcache.overall_misses 772 # number of overall misses
system.cpu.dcache.overall_misses_0 772 # number of overall misses
system.cpu.dcache.overall_misses 768 # number of overall misses
system.cpu.dcache.overall_misses_0 768 # number of overall misses
system.cpu.dcache.overall_misses_1 0 # number of overall misses
system.cpu.dcache.overall_mshr_hits 427 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_hits_0 427 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_hits 426 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_hits_0 426 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_hits_1 0 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 2243000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_latency_0 2243000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_latency 2222500 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_latency_0 2222500 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_latency_1 0 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate <err: div-0> # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_miss_rate_0 0.075114 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_miss_rate_0 0.074267 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_miss_rate_1 <err: div-0> # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 345 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_misses_0 345 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_misses 342 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_misses_0 342 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_misses_1 0 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.dcache.overall_mshr_uncacheable_latency_0 0 # number of overall MSHR uncacheable cycles
@ -206,149 +207,149 @@ system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.dcache.replacements 0 # number of replacements
system.cpu.dcache.replacements_0 0 # number of replacements
system.cpu.dcache.replacements_1 0 # number of replacements
system.cpu.dcache.sampled_refs 345 # Sample count of references to valid blocks.
system.cpu.dcache.sampled_refs 342 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.soft_prefetch_mshr_full_0 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.soft_prefetch_mshr_full_1 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 221.724795 # Cycle average of tags in use
system.cpu.dcache.total_refs 3821 # Total number of references to valid blocks.
system.cpu.dcache.tagsinuse 221.287284 # Cycle average of tags in use
system.cpu.dcache.total_refs 3837 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 0 # number of writebacks
system.cpu.dcache.writebacks_0 0 # number of writebacks
system.cpu.dcache.writebacks_1 0 # number of writebacks
system.cpu.decode.DECODE:BlockedCycles 1857 # Number of cycles decode is blocked
system.cpu.decode.DECODE:BranchMispred 251 # Number of times decode detected a branch misprediction
system.cpu.decode.DECODE:BranchResolved 346 # Number of times decode resolved a branch
system.cpu.decode.DECODE:DecodedInsts 21806 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 14535 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 3658 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 1498 # Number of cycles decode is squashing
system.cpu.decode.DECODE:SquashedInsts 351 # Number of squashed instructions handled by decode
system.cpu.decode.DECODE:BlockedCycles 1876 # Number of cycles decode is blocked
system.cpu.decode.DECODE:BranchMispred 246 # Number of times decode detected a branch misprediction
system.cpu.decode.DECODE:BranchResolved 345 # Number of times decode resolved a branch
system.cpu.decode.DECODE:DecodedInsts 21769 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 14522 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 3673 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 1511 # Number of cycles decode is squashing
system.cpu.decode.DECODE:SquashedInsts 346 # Number of squashed instructions handled by decode
system.cpu.decode.DECODE:UnblockCycles 145 # Number of cycles decode is unblocking
system.cpu.fetch.Branches 3964 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 2983 # Number of cache lines fetched
system.cpu.fetch.Cycles 6940 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 525 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 24033 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 1178 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.361053 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 2983 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 1206 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 2.188997 # Number of inst fetches per cycle
system.cpu.fetch.Branches 3940 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 3009 # Number of cache lines fetched
system.cpu.fetch.Cycles 6972 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 537 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 23897 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 1189 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.358802 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 3009 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 1221 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 2.176213 # Number of inst fetches per cycle
system.cpu.fetch.rateDist.start_dist # Number of instructions fetched each cycle (Total)
system.cpu.fetch.rateDist.samples 10979
system.cpu.fetch.rateDist.samples 10981
system.cpu.fetch.rateDist.min_value 0
0 7023 6396.76%
1 285 259.59%
2 224 204.03%
3 248 225.89%
4 335 305.13%
5 281 255.94%
6 301 274.16%
7 251 228.62%
8 2031 1849.90%
0 7019 6391.95%
1 293 266.82%
2 225 204.90%
3 260 236.77%
4 345 314.18%
5 288 262.27%
6 304 276.84%
7 246 224.02%
8 2001 1822.24%
system.cpu.fetch.rateDist.max_value 8
system.cpu.fetch.rateDist.end_dist
system.cpu.icache.ReadReq_accesses 2983 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_accesses_0 2983 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency_0 5910.313901 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency_0 5152.173913 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 2314 # number of ReadReq hits
system.cpu.icache.ReadReq_hits_0 2314 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 3954000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_latency_0 3954000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate_0 0.224271 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 669 # number of ReadReq misses
system.cpu.icache.ReadReq_misses_0 669 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 48 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_hits_0 48 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 3199500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_latency_0 3199500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate_0 0.208180 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 621 # number of ReadReq MSHR misses
system.cpu.icache.ReadReq_mshr_misses_0 621 # number of ReadReq MSHR misses
system.cpu.icache.ReadReq_accesses 3009 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_accesses_0 3009 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency_0 5911.144578 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency_0 5119.774920 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 2345 # number of ReadReq hits
system.cpu.icache.ReadReq_hits_0 2345 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 3925000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_latency_0 3925000 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate_0 0.220671 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 664 # number of ReadReq misses
system.cpu.icache.ReadReq_misses_0 664 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 42 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_hits_0 42 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 3184500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_latency_0 3184500 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate_0 0.206713 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 622 # number of ReadReq MSHR misses
system.cpu.icache.ReadReq_mshr_misses_0 622 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_refs 3.726248 # Average number of references to valid blocks.
system.cpu.icache.avg_refs 3.770096 # Average number of references to valid blocks.
system.cpu.icache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 2983 # number of demand (read+write) accesses
system.cpu.icache.demand_accesses_0 2983 # number of demand (read+write) accesses
system.cpu.icache.demand_accesses 3009 # number of demand (read+write) accesses
system.cpu.icache.demand_accesses_0 3009 # number of demand (read+write) accesses
system.cpu.icache.demand_accesses_1 0 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.icache.demand_avg_miss_latency_0 5910.313901 # average overall miss latency
system.cpu.icache.demand_avg_miss_latency_0 5911.144578 # average overall miss latency
system.cpu.icache.demand_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.icache.demand_avg_mshr_miss_latency_0 5152.173913 # average overall mshr miss latency
system.cpu.icache.demand_avg_mshr_miss_latency_0 5119.774920 # average overall mshr miss latency
system.cpu.icache.demand_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.icache.demand_hits 2314 # number of demand (read+write) hits
system.cpu.icache.demand_hits_0 2314 # number of demand (read+write) hits
system.cpu.icache.demand_hits 2345 # number of demand (read+write) hits
system.cpu.icache.demand_hits_0 2345 # number of demand (read+write) hits
system.cpu.icache.demand_hits_1 0 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 3954000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_latency_0 3954000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_latency 3925000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_latency_0 3925000 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_latency_1 0 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate <err: div-0> # miss rate for demand accesses
system.cpu.icache.demand_miss_rate_0 0.224271 # miss rate for demand accesses
system.cpu.icache.demand_miss_rate_0 0.220671 # miss rate for demand accesses
system.cpu.icache.demand_miss_rate_1 <err: div-0> # miss rate for demand accesses
system.cpu.icache.demand_misses 669 # number of demand (read+write) misses
system.cpu.icache.demand_misses_0 669 # number of demand (read+write) misses
system.cpu.icache.demand_misses 664 # number of demand (read+write) misses
system.cpu.icache.demand_misses_0 664 # number of demand (read+write) misses
system.cpu.icache.demand_misses_1 0 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 48 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_hits_0 48 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_hits 42 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_hits_0 42 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_hits_1 0 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 3199500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_latency_0 3199500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_latency 3184500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_latency_0 3184500 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_latency_1 0 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate <err: div-0> # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_miss_rate_0 0.208180 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_miss_rate_0 0.206713 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_miss_rate_1 <err: div-0> # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 621 # number of demand (read+write) MSHR misses
system.cpu.icache.demand_mshr_misses_0 621 # number of demand (read+write) MSHR misses
system.cpu.icache.demand_mshr_misses 622 # number of demand (read+write) MSHR misses
system.cpu.icache.demand_mshr_misses_0 622 # number of demand (read+write) MSHR misses
system.cpu.icache.demand_mshr_misses_1 0 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.mshr_cap_events_0 0 # number of times MSHR cap was activated
system.cpu.icache.mshr_cap_events_1 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 2983 # number of overall (read+write) accesses
system.cpu.icache.overall_accesses_0 2983 # number of overall (read+write) accesses
system.cpu.icache.overall_accesses 3009 # number of overall (read+write) accesses
system.cpu.icache.overall_accesses_0 3009 # number of overall (read+write) accesses
system.cpu.icache.overall_accesses_1 0 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.icache.overall_avg_miss_latency_0 5910.313901 # average overall miss latency
system.cpu.icache.overall_avg_miss_latency_0 5911.144578 # average overall miss latency
system.cpu.icache.overall_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_miss_latency_0 5152.173913 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_miss_latency_0 5119.774920 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency_0 <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency_1 <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 2314 # number of overall hits
system.cpu.icache.overall_hits_0 2314 # number of overall hits
system.cpu.icache.overall_hits 2345 # number of overall hits
system.cpu.icache.overall_hits_0 2345 # number of overall hits
system.cpu.icache.overall_hits_1 0 # number of overall hits
system.cpu.icache.overall_miss_latency 3954000 # number of overall miss cycles
system.cpu.icache.overall_miss_latency_0 3954000 # number of overall miss cycles
system.cpu.icache.overall_miss_latency 3925000 # number of overall miss cycles
system.cpu.icache.overall_miss_latency_0 3925000 # number of overall miss cycles
system.cpu.icache.overall_miss_latency_1 0 # number of overall miss cycles
system.cpu.icache.overall_miss_rate <err: div-0> # miss rate for overall accesses
system.cpu.icache.overall_miss_rate_0 0.224271 # miss rate for overall accesses
system.cpu.icache.overall_miss_rate_0 0.220671 # miss rate for overall accesses
system.cpu.icache.overall_miss_rate_1 <err: div-0> # miss rate for overall accesses
system.cpu.icache.overall_misses 669 # number of overall misses
system.cpu.icache.overall_misses_0 669 # number of overall misses
system.cpu.icache.overall_misses 664 # number of overall misses
system.cpu.icache.overall_misses_0 664 # number of overall misses
system.cpu.icache.overall_misses_1 0 # number of overall misses
system.cpu.icache.overall_mshr_hits 48 # number of overall MSHR hits
system.cpu.icache.overall_mshr_hits_0 48 # number of overall MSHR hits
system.cpu.icache.overall_mshr_hits 42 # number of overall MSHR hits
system.cpu.icache.overall_mshr_hits_0 42 # number of overall MSHR hits
system.cpu.icache.overall_mshr_hits_1 0 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 3199500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_latency_0 3199500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_latency 3184500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_latency_0 3184500 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_latency_1 0 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate <err: div-0> # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_miss_rate_0 0.208180 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_miss_rate_0 0.206713 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_miss_rate_1 <err: div-0> # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 621 # number of overall MSHR misses
system.cpu.icache.overall_mshr_misses_0 621 # number of overall MSHR misses
system.cpu.icache.overall_mshr_misses 622 # number of overall MSHR misses
system.cpu.icache.overall_mshr_misses_0 622 # number of overall MSHR misses
system.cpu.icache.overall_mshr_misses_1 0 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.icache.overall_mshr_uncacheable_latency_0 0 # number of overall MSHR uncacheable cycles
@ -368,104 +369,104 @@ system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.icache.replacements 9 # number of replacements
system.cpu.icache.replacements_0 9 # number of replacements
system.cpu.icache.replacements_1 0 # number of replacements
system.cpu.icache.sampled_refs 621 # Sample count of references to valid blocks.
system.cpu.icache.sampled_refs 622 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.soft_prefetch_mshr_full_0 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.soft_prefetch_mshr_full_1 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 322.894952 # Cycle average of tags in use
system.cpu.icache.total_refs 2314 # Total number of references to valid blocks.
system.cpu.icache.tagsinuse 323.196356 # Cycle average of tags in use
system.cpu.icache.total_refs 2345 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.icache.writebacks_0 0 # number of writebacks
system.cpu.icache.writebacks_1 0 # number of writebacks
system.cpu.idleCycles 1998 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 2367 # Number of branches executed
system.cpu.iew.EXEC:branches_0 1185 # Number of branches executed
system.cpu.iew.EXEC:branches_1 1182 # Number of branches executed
system.cpu.iew.EXEC:nop 73 # number of nop insts executed
system.cpu.idleCycles 2997 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 2377 # Number of branches executed
system.cpu.iew.EXEC:branches_0 1192 # Number of branches executed
system.cpu.iew.EXEC:branches_1 1185 # Number of branches executed
system.cpu.iew.EXEC:nop 72 # number of nop insts executed
system.cpu.iew.EXEC:nop_0 37 # number of nop insts executed
system.cpu.iew.EXEC:nop_1 36 # number of nop insts executed
system.cpu.iew.EXEC:rate 1.416158 # Inst execution rate
system.cpu.iew.EXEC:refs 4978 # number of memory reference insts executed
system.cpu.iew.EXEC:refs_0 2514 # number of memory reference insts executed
system.cpu.iew.EXEC:refs_1 2464 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 1867 # Number of stores executed
system.cpu.iew.EXEC:stores_0 938 # Number of stores executed
system.cpu.iew.EXEC:stores_1 929 # Number of stores executed
system.cpu.iew.EXEC:nop_1 35 # number of nop insts executed
system.cpu.iew.EXEC:rate 1.419725 # Inst execution rate
system.cpu.iew.EXEC:refs 5002 # number of memory reference insts executed
system.cpu.iew.EXEC:refs_0 2507 # number of memory reference insts executed
system.cpu.iew.EXEC:refs_1 2495 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 1874 # Number of stores executed
system.cpu.iew.EXEC:stores_0 933 # Number of stores executed
system.cpu.iew.EXEC:stores_1 941 # Number of stores executed
system.cpu.iew.EXEC:swp 0 # number of swp insts executed
system.cpu.iew.EXEC:swp_0 0 # number of swp insts executed
system.cpu.iew.EXEC:swp_1 0 # number of swp insts executed
system.cpu.iew.WB:consumers 10219 # num instructions consuming a value
system.cpu.iew.WB:consumers_0 5113 # num instructions consuming a value
system.cpu.iew.WB:consumers_1 5106 # num instructions consuming a value
system.cpu.iew.WB:count 14974 # cumulative count of insts written-back
system.cpu.iew.WB:count_0 7532 # cumulative count of insts written-back
system.cpu.iew.WB:count_1 7442 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 1.526960 # average fanout of values written-back
system.cpu.iew.WB:fanout_0 0.762957 # average fanout of values written-back
system.cpu.iew.WB:fanout_1 0.764003 # average fanout of values written-back
system.cpu.iew.WB:consumers 10260 # num instructions consuming a value
system.cpu.iew.WB:consumers_0 5135 # num instructions consuming a value
system.cpu.iew.WB:consumers_1 5125 # num instructions consuming a value
system.cpu.iew.WB:count 14994 # cumulative count of insts written-back
system.cpu.iew.WB:count_0 7526 # cumulative count of insts written-back
system.cpu.iew.WB:count_1 7468 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 1.530607 # average fanout of values written-back
system.cpu.iew.WB:fanout_0 0.763778 # average fanout of values written-back
system.cpu.iew.WB:fanout_1 0.766829 # average fanout of values written-back
system.cpu.iew.WB:penalized 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_0 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_1 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_rate 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:penalized_rate_0 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:penalized_rate_1 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:producers 7802 # num instructions producing a value
system.cpu.iew.WB:producers_0 3901 # num instructions producing a value
system.cpu.iew.WB:producers_1 3901 # num instructions producing a value
system.cpu.iew.WB:rate 1.363876 # insts written-back per cycle
system.cpu.iew.WB:rate_0 0.686037 # insts written-back per cycle
system.cpu.iew.WB:rate_1 0.677840 # insts written-back per cycle
system.cpu.iew.WB:sent 15105 # cumulative count of insts sent to commit
system.cpu.iew.WB:sent_0 7590 # cumulative count of insts sent to commit
system.cpu.iew.WB:sent_1 7515 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 941 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 7 # Number of cycles IEW is blocking
system.cpu.iew.iewDispLoadInsts 3823 # Number of dispatched load instructions
system.cpu.iew.WB:producers 7852 # num instructions producing a value
system.cpu.iew.WB:producers_0 3922 # num instructions producing a value
system.cpu.iew.WB:producers_1 3930 # num instructions producing a value
system.cpu.iew.WB:rate 1.365449 # insts written-back per cycle
system.cpu.iew.WB:rate_0 0.685366 # insts written-back per cycle
system.cpu.iew.WB:rate_1 0.680084 # insts written-back per cycle
system.cpu.iew.WB:sent 15132 # cumulative count of insts sent to commit
system.cpu.iew.WB:sent_0 7582 # cumulative count of insts sent to commit
system.cpu.iew.WB:sent_1 7550 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 958 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 6 # Number of cycles IEW is blocking
system.cpu.iew.iewDispLoadInsts 3837 # Number of dispatched load instructions
system.cpu.iew.iewDispNonSpecInsts 42 # Number of dispatched non-speculative instructions
system.cpu.iew.iewDispSquashedInsts 501 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 2178 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 19078 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 3111 # Number of load instructions executed
system.cpu.iew.iewExecLoadInsts_0 1576 # Number of load instructions executed
system.cpu.iew.iewExecLoadInsts_1 1535 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 864 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 15548 # Number of executed instructions
system.cpu.iew.iewDispSquashedInsts 445 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 2172 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 19086 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 3128 # Number of load instructions executed
system.cpu.iew.iewExecLoadInsts_0 1574 # Number of load instructions executed
system.cpu.iew.iewExecLoadInsts_1 1554 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 852 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 15590 # Number of executed instructions
system.cpu.iew.iewIQFullEvents 0 # Number of times the IQ has become full, causing a stall
system.cpu.iew.iewIdleCycles 0 # Number of cycles IEW is idle
system.cpu.iew.iewLSQFullEvents 0 # Number of times the LSQ has become full, causing a stall
system.cpu.iew.iewSquashCycles 1498 # Number of cycles IEW is squashing
system.cpu.iew.iewSquashCycles 1511 # Number of cycles IEW is squashing
system.cpu.iew.iewUnblockCycles 0 # Number of cycles IEW is unblocking
system.cpu.iew.lsq.thread.0.blockedLoads 0 # Number of blocked loads due to partial load-store forwarding
system.cpu.iew.lsq.thread.0.cacheBlocked 0 # Number of times an access to memory failed due to the cache being blocked
system.cpu.iew.lsq.thread.0.forwLoads 42 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.0.forwLoads 43 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.0.ignoredResponses 4 # Number of memory responses ignored because the instruction is squashed
system.cpu.iew.lsq.thread.0.invAddrLoads 0 # Number of loads ignored due to an invalid address
system.cpu.iew.lsq.thread.0.invAddrSwpfs 0 # Number of software prefetches ignored due to an invalid address
system.cpu.iew.lsq.thread.0.memOrderViolation 63 # Number of memory ordering violations
system.cpu.iew.lsq.thread.0.memOrderViolation 64 # Number of memory ordering violations
system.cpu.iew.lsq.thread.0.rescheduledLoads 1 # Number of loads that were rescheduled
system.cpu.iew.lsq.thread.0.squashedLoads 946 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 276 # Number of stores squashed
system.cpu.iew.lsq.thread.0.squashedLoads 955 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 270 # Number of stores squashed
system.cpu.iew.lsq.thread.1.blockedLoads 0 # Number of blocked loads due to partial load-store forwarding
system.cpu.iew.lsq.thread.1.cacheBlocked 0 # Number of times an access to memory failed due to the cache being blocked
system.cpu.iew.lsq.thread.1.forwLoads 38 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.1.ignoredResponses 0 # Number of memory responses ignored because the instruction is squashed
system.cpu.iew.lsq.thread.1.forwLoads 42 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.1.ignoredResponses 2 # Number of memory responses ignored because the instruction is squashed
system.cpu.iew.lsq.thread.1.invAddrLoads 0 # Number of loads ignored due to an invalid address
system.cpu.iew.lsq.thread.1.invAddrSwpfs 0 # Number of software prefetches ignored due to an invalid address
system.cpu.iew.lsq.thread.1.memOrderViolation 54 # Number of memory ordering violations
system.cpu.iew.lsq.thread.1.memOrderViolation 58 # Number of memory ordering violations
system.cpu.iew.lsq.thread.1.rescheduledLoads 1 # Number of loads that were rescheduled
system.cpu.iew.lsq.thread.1.squashedLoads 919 # Number of loads squashed
system.cpu.iew.lsq.thread.1.squashedLoads 924 # Number of loads squashed
system.cpu.iew.lsq.thread.1.squashedStores 278 # Number of stores squashed
system.cpu.iew.memOrderViolationEvents 117 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 761 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 180 # Number of branches that were predicted taken incorrectly
system.cpu.ipc_0 0.512160 # IPC: Instructions Per Cycle
system.cpu.ipc_1 0.512251 # IPC: Instructions Per Cycle
system.cpu.ipc_total 1.024410 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 8232 # Type of FU issued
system.cpu.iew.memOrderViolationEvents 122 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 767 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 191 # Number of branches that were predicted taken incorrectly
system.cpu.ipc_0 0.512066 # IPC: Instructions Per Cycle
system.cpu.ipc_1 0.512157 # IPC: Instructions Per Cycle
system.cpu.ipc_total 1.024224 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 8235 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.start_dist
No_OpClass 2 0.02% # Type of FU issued
IntAlu 5551 67.43% # Type of FU issued
IntAlu 5567 67.60% # Type of FU issued
IntMult 1 0.01% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 2 0.02% # Type of FU issued
@ -474,15 +475,15 @@ system.cpu.iq.ISSUE:FU_type_0.start_dist
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 1704 20.70% # Type of FU issued
MemWrite 972 11.81% # Type of FU issued
MemRead 1702 20.67% # Type of FU issued
MemWrite 961 11.67% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.end_dist
system.cpu.iq.ISSUE:FU_type_1 8180 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_1 8207 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_1.start_dist
No_OpClass 2 0.02% # Type of FU issued
IntAlu 5536 67.68% # Type of FU issued
IntAlu 5547 67.59% # Type of FU issued
IntMult 1 0.01% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 2 0.02% # Type of FU issued
@ -491,15 +492,15 @@ system.cpu.iq.ISSUE:FU_type_1.start_dist
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 1681 20.55% # Type of FU issued
MemWrite 958 11.71% # Type of FU issued
MemRead 1690 20.59% # Type of FU issued
MemWrite 965 11.76% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type_1.end_dist
system.cpu.iq.ISSUE:FU_type 16412 # Type of FU issued
system.cpu.iq.ISSUE:FU_type 16442 # Type of FU issued
system.cpu.iq.ISSUE:FU_type.start_dist
No_OpClass 4 0.02% # Type of FU issued
IntAlu 11087 67.55% # Type of FU issued
IntAlu 11114 67.60% # Type of FU issued
IntMult 2 0.01% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 4 0.02% # Type of FU issued
@ -508,20 +509,20 @@ system.cpu.iq.ISSUE:FU_type.start_dist
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 3385 20.63% # Type of FU issued
MemWrite 1930 11.76% # Type of FU issued
MemRead 3392 20.63% # Type of FU issued
MemWrite 1926 11.71% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type.end_dist
system.cpu.iq.ISSUE:fu_busy_cnt 180 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_cnt_0 92 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_cnt_1 88 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.010968 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_rate_0 0.005606 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_rate_1 0.005362 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_cnt 189 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_cnt_0 98 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_cnt_1 91 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.011495 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_rate_0 0.005960 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_rate_1 0.005535 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_full.start_dist
No_OpClass 0 0.00% # attempts to use FU when none available
IntAlu 16 8.89% # attempts to use FU when none available
IntAlu 14 7.41% # attempts to use FU when none available
IntMult 0 0.00% # attempts to use FU when none available
IntDiv 0 0.00% # attempts to use FU when none available
FloatAdd 0 0.00% # attempts to use FU when none available
@ -530,104 +531,104 @@ system.cpu.iq.ISSUE:fu_full.start_dist
FloatMult 0 0.00% # attempts to use FU when none available
FloatDiv 0 0.00% # attempts to use FU when none available
FloatSqrt 0 0.00% # attempts to use FU when none available
MemRead 97 53.89% # attempts to use FU when none available
MemWrite 67 37.22% # attempts to use FU when none available
MemRead 107 56.61% # attempts to use FU when none available
MemWrite 68 35.98% # attempts to use FU when none available
IprAccess 0 0.00% # attempts to use FU when none available
InstPrefetch 0 0.00% # attempts to use FU when none available
system.cpu.iq.ISSUE:fu_full.end_dist
system.cpu.iq.ISSUE:issued_per_cycle.start_dist # Number of insts issued each cycle
system.cpu.iq.ISSUE:issued_per_cycle.samples 10979
system.cpu.iq.ISSUE:issued_per_cycle.samples 10981
system.cpu.iq.ISSUE:issued_per_cycle.min_value 0
0 4788 4361.05%
1 1816 1654.07%
2 1657 1509.24%
3 1039 946.35%
4 774 704.98%
5 501 456.33%
6 289 263.23%
7 90 81.97%
8 25 22.77%
0 4775 4348.42%
1 1817 1654.68%
2 1638 1491.67%
3 1107 1008.10%
4 745 678.44%
5 490 446.23%
6 287 261.36%
7 100 91.07%
8 22 20.03%
system.cpu.iq.ISSUE:issued_per_cycle.max_value 8
system.cpu.iq.ISSUE:issued_per_cycle.end_dist
system.cpu.iq.ISSUE:rate 1.494854 # Inst issue rate
system.cpu.iq.iqInstsAdded 18963 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 16412 # Number of instructions issued
system.cpu.iq.ISSUE:rate 1.497314 # Inst issue rate
system.cpu.iq.iqInstsAdded 18972 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 16442 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 42 # Number of non-speculative instructions added to the IQ
system.cpu.iq.iqSquashedInstsExamined 6896 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 34 # Number of squashed instructions issued
system.cpu.iq.iqSquashedInstsExamined 6918 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 63 # Number of squashed instructions issued
system.cpu.iq.iqSquashedNonSpecRemoved 8 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 4313 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 963 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_accesses_0 963 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency_0 5220.374220 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency_0 2725.051975 # average ReadReq mshr miss latency
system.cpu.iq.iqSquashedOperandsExamined 4274 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 962 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_accesses_0 962 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency_0 5208.636837 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency_0 2724.765869 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_hits 1 # number of ReadReq hits
system.cpu.l2cache.ReadReq_hits_0 1 # number of ReadReq hits
system.cpu.l2cache.ReadReq_miss_latency 5022000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_latency_0 5022000 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate_0 0.998962 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 962 # number of ReadReq misses
system.cpu.l2cache.ReadReq_misses_0 962 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 2621500 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_latency_0 2621500 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate_0 0.998962 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 962 # number of ReadReq MSHR misses
system.cpu.l2cache.ReadReq_mshr_misses_0 962 # number of ReadReq MSHR misses
system.cpu.l2cache.ReadReq_miss_latency 5005500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_latency_0 5005500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate_0 0.998960 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 961 # number of ReadReq misses
system.cpu.l2cache.ReadReq_misses_0 961 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 2618500 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_latency_0 2618500 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate_0 0.998960 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 961 # number of ReadReq MSHR misses
system.cpu.l2cache.ReadReq_mshr_misses_0 961 # number of ReadReq MSHR misses
system.cpu.l2cache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.l2cache.avg_refs 0.001040 # Average number of references to valid blocks.
system.cpu.l2cache.avg_refs 0.001041 # Average number of references to valid blocks.
system.cpu.l2cache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.l2cache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 963 # number of demand (read+write) accesses
system.cpu.l2cache.demand_accesses_0 963 # number of demand (read+write) accesses
system.cpu.l2cache.demand_accesses 962 # number of demand (read+write) accesses
system.cpu.l2cache.demand_accesses_0 962 # number of demand (read+write) accesses
system.cpu.l2cache.demand_accesses_1 0 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.l2cache.demand_avg_miss_latency_0 5220.374220 # average overall miss latency
system.cpu.l2cache.demand_avg_miss_latency_0 5208.636837 # average overall miss latency
system.cpu.l2cache.demand_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency_0 2725.051975 # average overall mshr miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency_0 2724.765869 # average overall mshr miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.l2cache.demand_hits 1 # number of demand (read+write) hits
system.cpu.l2cache.demand_hits_0 1 # number of demand (read+write) hits
system.cpu.l2cache.demand_hits_1 0 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 5022000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency_0 5022000 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency 5005500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency_0 5005500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_latency_1 0 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate <err: div-0> # miss rate for demand accesses
system.cpu.l2cache.demand_miss_rate_0 0.998962 # miss rate for demand accesses
system.cpu.l2cache.demand_miss_rate_0 0.998960 # miss rate for demand accesses
system.cpu.l2cache.demand_miss_rate_1 <err: div-0> # miss rate for demand accesses
system.cpu.l2cache.demand_misses 962 # number of demand (read+write) misses
system.cpu.l2cache.demand_misses_0 962 # number of demand (read+write) misses
system.cpu.l2cache.demand_misses 961 # number of demand (read+write) misses
system.cpu.l2cache.demand_misses_0 961 # number of demand (read+write) misses
system.cpu.l2cache.demand_misses_1 0 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_hits_0 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_hits_1 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_miss_latency 2621500 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency_0 2621500 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency 2618500 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency_0 2618500 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency_1 0 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate <err: div-0> # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_miss_rate_0 0.998962 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_miss_rate_0 0.998960 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_miss_rate_1 <err: div-0> # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 962 # number of demand (read+write) MSHR misses
system.cpu.l2cache.demand_mshr_misses_0 962 # number of demand (read+write) MSHR misses
system.cpu.l2cache.demand_mshr_misses 961 # number of demand (read+write) MSHR misses
system.cpu.l2cache.demand_mshr_misses_0 961 # number of demand (read+write) MSHR misses
system.cpu.l2cache.demand_mshr_misses_1 0 # number of demand (read+write) MSHR misses
system.cpu.l2cache.fast_writes 0 # number of fast writes performed
system.cpu.l2cache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.l2cache.mshr_cap_events_0 0 # number of times MSHR cap was activated
system.cpu.l2cache.mshr_cap_events_1 0 # number of times MSHR cap was activated
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 963 # number of overall (read+write) accesses
system.cpu.l2cache.overall_accesses_0 963 # number of overall (read+write) accesses
system.cpu.l2cache.overall_accesses 962 # number of overall (read+write) accesses
system.cpu.l2cache.overall_accesses_0 962 # number of overall (read+write) accesses
system.cpu.l2cache.overall_accesses_1 0 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency <err: div-0> # average overall miss latency
system.cpu.l2cache.overall_avg_miss_latency_0 5220.374220 # average overall miss latency
system.cpu.l2cache.overall_avg_miss_latency_0 5208.636837 # average overall miss latency
system.cpu.l2cache.overall_avg_miss_latency_1 <err: div-0> # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency <err: div-0> # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency_0 2725.051975 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency_0 2724.765869 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency_1 <err: div-0> # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency_0 <err: div-0> # average overall mshr uncacheable latency
@ -635,26 +636,26 @@ system.cpu.l2cache.overall_avg_mshr_uncacheable_latency_1 <err: div-0>
system.cpu.l2cache.overall_hits 1 # number of overall hits
system.cpu.l2cache.overall_hits_0 1 # number of overall hits
system.cpu.l2cache.overall_hits_1 0 # number of overall hits
system.cpu.l2cache.overall_miss_latency 5022000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency_0 5022000 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency 5005500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency_0 5005500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_latency_1 0 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate <err: div-0> # miss rate for overall accesses
system.cpu.l2cache.overall_miss_rate_0 0.998962 # miss rate for overall accesses
system.cpu.l2cache.overall_miss_rate_0 0.998960 # miss rate for overall accesses
system.cpu.l2cache.overall_miss_rate_1 <err: div-0> # miss rate for overall accesses
system.cpu.l2cache.overall_misses 962 # number of overall misses
system.cpu.l2cache.overall_misses_0 962 # number of overall misses
system.cpu.l2cache.overall_misses 961 # number of overall misses
system.cpu.l2cache.overall_misses_0 961 # number of overall misses
system.cpu.l2cache.overall_misses_1 0 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_hits_0 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_hits_1 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_miss_latency 2621500 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency_0 2621500 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency 2618500 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency_0 2618500 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency_1 0 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate <err: div-0> # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_miss_rate_0 0.998962 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_miss_rate_0 0.998960 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_miss_rate_1 <err: div-0> # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 962 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_misses_0 962 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_misses 961 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_misses_0 961 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_misses_1 0 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.l2cache.overall_mshr_uncacheable_latency_0 0 # number of overall MSHR uncacheable cycles
@ -674,33 +675,33 @@ system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.l2cache.replacements 0 # number of replacements
system.cpu.l2cache.replacements_0 0 # number of replacements
system.cpu.l2cache.replacements_1 0 # number of replacements
system.cpu.l2cache.sampled_refs 962 # Sample count of references to valid blocks.
system.cpu.l2cache.sampled_refs 961 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.soft_prefetch_mshr_full_0 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.soft_prefetch_mshr_full_1 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 545.133409 # Cycle average of tags in use
system.cpu.l2cache.tagsinuse 545.318204 # Cycle average of tags in use
system.cpu.l2cache.total_refs 1 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 0 # number of writebacks
system.cpu.l2cache.writebacks_0 0 # number of writebacks
system.cpu.l2cache.writebacks_1 0 # number of writebacks
system.cpu.numCycles 10979 # number of cpu cycles simulated
system.cpu.rename.RENAME:BlockCycles 614 # Number of cycles rename is blocking
system.cpu.numCycles 10981 # number of cpu cycles simulated
system.cpu.rename.RENAME:BlockCycles 612 # Number of cycles rename is blocking
system.cpu.rename.RENAME:CommittedMaps 8102 # Number of HB maps that are committed
system.cpu.rename.RENAME:IdleCycles 14840 # Number of cycles rename is idle
system.cpu.rename.RENAME:LSQFullEvents 684 # Number of times rename has blocked due to LSQ full
system.cpu.rename.RENAME:RenameLookups 26359 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 20748 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 15612 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 3480 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 1498 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 744 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 7510 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 517 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:IdleCycles 14828 # Number of cycles rename is idle
system.cpu.rename.RENAME:LSQFullEvents 692 # Number of times rename has blocked due to LSQ full
system.cpu.rename.RENAME:RenameLookups 26356 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 20731 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 15606 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 3494 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 1511 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 761 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 7504 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 521 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:serializingInsts 48 # count of serializing insts renamed
system.cpu.rename.RENAME:skidInsts 2147 # count of insts added to the skid buffer
system.cpu.rename.RENAME:skidInsts 2159 # count of insts added to the skid buffer
system.cpu.rename.RENAME:tempSerializingInsts 37 # count of temporary serializing insts renamed
system.cpu.timesIdled 2 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.timesIdled 3 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.workload0.PROG:num_syscalls 17 # Number of system calls
system.cpu.workload1.PROG:num_syscalls 17 # Number of system calls

View file

@ -7,9 +7,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled Jun 10 2007 14:06:20
M5 started Sun Jun 10 14:22:38 2007
M5 executing on iceaxe
command line: /Users/nate/build/outgoing/build/ALPHA_SE/m5.debug -d /Users/nate/build/outgoing/build/ALPHA_SE/tests/debug/quick/01.hello-2T-smt/alpha/linux/o3-timing tests/run.py quick/01.hello-2T-smt/alpha/linux/o3-timing
M5 compiled Jun 21 2007 21:25:27
M5 started Fri Jun 22 00:04:51 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/ALPHA_SE/m5.fast -d build/ALPHA_SE/tests/fast/quick/01.hello-2T-smt/alpha/linux/o3-timing tests/run.py quick/01.hello-2T-smt/alpha/linux/o3-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 5490000 because target called exit()
Exiting @ tick 5491500 because target called exit()

View file

@ -21,6 +21,7 @@ SQEntries=32
SSITSize=1024
activity=0
backComSize=5
cachePorts=200
choiceCtrBits=2
choicePredictorSize=8192
clock=500
@ -74,6 +75,15 @@ renameToFetchDelay=1
renameToIEWDelay=2
renameToROBDelay=1
renameWidth=8
smtCommitPolicy=RoundRobin
smtFetchPolicy=SingleThread
smtIQPolicy=Partitioned
smtIQThreshold=100
smtLSQPolicy=Partitioned
smtLSQThreshold=100
smtNumFetchingThreads=1
smtROBPolicy=Partitioned
smtROBThreshold=100
squashWidth=8
system=system
trapLatency=13
@ -86,6 +96,7 @@ icache_port=system.cpu.icache.cpu_side
[system.cpu.dcache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -99,7 +110,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -261,6 +272,7 @@ opLat=3
[system.cpu.icache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -274,7 +286,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -299,6 +311,7 @@ mem_side=system.cpu.toL2Bus.port[0]
[system.cpu.l2cache]
type=BaseCache
adaptive_compression=false
addr_range=0:18446744073709551615
assoc=2
block_size=64
compressed_bus=false
@ -312,7 +325,7 @@ prefetch_access=false
prefetch_cache_check_push=true
prefetch_data_accesses_only=false
prefetch_degree=1
prefetch_latency=10
prefetch_latency=10000
prefetch_miss=false
prefetch_past_page=false
prefetch_policy=none
@ -366,7 +379,7 @@ bus_id=0
clock=1000
responder_set=false
width=64
port=system.physmem.port system.cpu.l2cache.mem_side
port=system.physmem.port[0] system.cpu.l2cache.mem_side
[system.physmem]
type=PhysicalMemory

View file

@ -275,7 +275,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
@ -312,7 +312,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true
@ -349,7 +349,7 @@ prefetch_access=false
prefetcher_size=100
prefetch_past_page=false
prefetch_serial_squash=false
prefetch_latency=10
prefetch_latency=10000
prefetch_degree=1
prefetch_policy=none
prefetch_cache_check_push=true

View file

@ -1,40 +1,40 @@
---------- Begin Simulation Statistics ----------
global.BPredUnit.BTBCorrect 0 # Number of correct BTB predictions (this stat may not work properly.
global.BPredUnit.BTBHits 2726 # Number of BTB hits
global.BPredUnit.BTBLookups 7230 # Number of BTB lookups
global.BPredUnit.BTBHits 2589 # Number of BTB hits
global.BPredUnit.BTBLookups 6396 # Number of BTB lookups
global.BPredUnit.RASInCorrect 0 # Number of incorrect RAS predictions.
global.BPredUnit.condIncorrect 2062 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 7954 # Number of conditional branches predicted
global.BPredUnit.lookups 7954 # Number of BP lookups
global.BPredUnit.condIncorrect 2002 # Number of conditional branches incorrect
global.BPredUnit.condPredicted 6955 # Number of conditional branches predicted
global.BPredUnit.lookups 6955 # Number of BP lookups
global.BPredUnit.usedRAS 0 # Number of times the RAS was used to get a target.
host_inst_rate 37089 # Simulator instruction rate (inst/s)
host_mem_usage 154932 # Number of bytes of host memory used
host_seconds 0.30 # Real time elapsed on the host
host_tick_rate 53780846 # Simulator tick rate (ticks/s)
host_inst_rate 33806 # Simulator instruction rate (inst/s)
host_mem_usage 154936 # Number of bytes of host memory used
host_seconds 0.32 # Real time elapsed on the host
host_tick_rate 48256964 # Simulator tick rate (ticks/s)
memdepunit.memDep.conflictingLoads 10 # Number of conflicting loads.
memdepunit.memDep.conflictingStores 0 # Number of conflicting stores.
memdepunit.memDep.insertedLoads 3198 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 2970 # Number of stores inserted to the mem dependence unit.
memdepunit.memDep.insertedLoads 2999 # Number of loads inserted to the mem dependence unit.
memdepunit.memDep.insertedStores 2872 # Number of stores inserted to the mem dependence unit.
sim_freq 1000000000000 # Frequency of simulated ticks
sim_insts 10976 # Number of instructions simulated
sim_seconds 0.000016 # Number of seconds simulated
sim_ticks 15931500 # Number of ticks simulated
sim_ticks 15682500 # Number of ticks simulated
system.cpu.commit.COM:branches 2152 # Number of branches committed
system.cpu.commit.COM:bw_lim_events 146 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_lim_events 199 # number cycles where commit BW limit reached
system.cpu.commit.COM:bw_limited 0 # number of insts not committed due to BW limits
system.cpu.commit.COM:committed_per_cycle.start_dist # Number of insts commited each cycle
system.cpu.commit.COM:committed_per_cycle.samples 28801
system.cpu.commit.COM:committed_per_cycle.samples 28561
system.cpu.commit.COM:committed_per_cycle.min_value 0
0 23411 8128.54%
1 2862 993.72%
2 1174 407.62%
3 608 211.10%
4 359 124.65%
5 123 42.71%
6 103 35.76%
7 15 5.21%
8 146 50.69%
0 23237 8135.92%
1 2855 999.61%
2 1132 396.34%
3 638 223.38%
4 273 95.58%
5 119 41.67%
6 92 32.21%
7 16 5.60%
8 199 69.68%
system.cpu.commit.COM:committed_per_cycle.max_value 8
system.cpu.commit.COM:committed_per_cycle.end_dist
@ -43,71 +43,71 @@ system.cpu.commit.COM:loads 1462 # Nu
system.cpu.commit.COM:membars 0 # Number of memory barriers committed
system.cpu.commit.COM:refs 2760 # Number of memory references committed
system.cpu.commit.COM:swp_count 0 # Number of s/w prefetches committed
system.cpu.commit.branchMispredicts 2062 # The number of times a branch was mispredicted
system.cpu.commit.branchMispredicts 2002 # The number of times a branch was mispredicted
system.cpu.commit.commitCommittedInsts 10976 # The number of committed instructions
system.cpu.commit.commitNonSpecStalls 327 # The number of times commit has been forced to stall to communicate backwards
system.cpu.commit.commitSquashedInsts 14297 # The number of squashed insts skipped by commit
system.cpu.commit.commitNonSpecStalls 329 # The number of times commit has been forced to stall to communicate backwards
system.cpu.commit.commitSquashedInsts 12659 # The number of squashed insts skipped by commit
system.cpu.committedInsts 10976 # Number of Instructions Simulated
system.cpu.committedInsts_total 10976 # Number of Instructions Simulated
system.cpu.cpi 2.903061 # CPI: Cycles Per Instruction
system.cpu.cpi_total 2.903061 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 2743 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 5392.857143 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 4696.969697 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 2659 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 453000 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.030623 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 84 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 18 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 310000 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.024061 # mshr miss rate for ReadReq accesses
system.cpu.cpi 2.857598 # CPI: Cycles Per Instruction
system.cpu.cpi_total 2.857598 # CPI: Total CPI of All Threads
system.cpu.dcache.ReadReq_accesses 2313 # number of ReadReq accesses(hits+misses)
system.cpu.dcache.ReadReq_avg_miss_latency 5451.807229 # average ReadReq miss latency
system.cpu.dcache.ReadReq_avg_mshr_miss_latency 4719.696970 # average ReadReq mshr miss latency
system.cpu.dcache.ReadReq_hits 2230 # number of ReadReq hits
system.cpu.dcache.ReadReq_miss_latency 452500 # number of ReadReq miss cycles
system.cpu.dcache.ReadReq_miss_rate 0.035884 # miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_misses 83 # number of ReadReq misses
system.cpu.dcache.ReadReq_mshr_hits 17 # number of ReadReq MSHR hits
system.cpu.dcache.ReadReq_mshr_miss_latency 311500 # number of ReadReq MSHR miss cycles
system.cpu.dcache.ReadReq_mshr_miss_rate 0.028534 # mshr miss rate for ReadReq accesses
system.cpu.dcache.ReadReq_mshr_misses 66 # number of ReadReq MSHR misses
system.cpu.dcache.SwapReq_accesses 6 # number of SwapReq accesses(hits+misses)
system.cpu.dcache.SwapReq_hits 6 # number of SwapReq hits
system.cpu.dcache.WriteReq_accesses 1292 # number of WriteReq accesses(hits+misses)
system.cpu.dcache.WriteReq_avg_miss_latency 5505 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_miss_latency 5522.613065 # average WriteReq miss latency
system.cpu.dcache.WriteReq_avg_mshr_miss_latency 4802.325581 # average WriteReq mshr miss latency
system.cpu.dcache.WriteReq_hits 1092 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 1101000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.154799 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 200 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 114 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_hits 1093 # number of WriteReq hits
system.cpu.dcache.WriteReq_miss_latency 1099000 # number of WriteReq miss cycles
system.cpu.dcache.WriteReq_miss_rate 0.154025 # miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_misses 199 # number of WriteReq misses
system.cpu.dcache.WriteReq_mshr_hits 113 # number of WriteReq MSHR hits
system.cpu.dcache.WriteReq_mshr_miss_latency 413000 # number of WriteReq MSHR miss cycles
system.cpu.dcache.WriteReq_mshr_miss_rate 0.066563 # mshr miss rate for WriteReq accesses
system.cpu.dcache.WriteReq_mshr_misses 86 # number of WriteReq MSHR misses
system.cpu.dcache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.dcache.avg_refs 24.717105 # Average number of references to valid blocks.
system.cpu.dcache.avg_refs 21.901316 # Average number of references to valid blocks.
system.cpu.dcache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.dcache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.dcache.cache_copies 0 # number of cache copies performed
system.cpu.dcache.demand_accesses 4035 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 5471.830986 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 4756.578947 # average overall mshr miss latency
system.cpu.dcache.demand_hits 3751 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 1554000 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.070384 # miss rate for demand accesses
system.cpu.dcache.demand_misses 284 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 132 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 723000 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.037670 # mshr miss rate for demand accesses
system.cpu.dcache.demand_accesses 3605 # number of demand (read+write) accesses
system.cpu.dcache.demand_avg_miss_latency 5501.773050 # average overall miss latency
system.cpu.dcache.demand_avg_mshr_miss_latency 4766.447368 # average overall mshr miss latency
system.cpu.dcache.demand_hits 3323 # number of demand (read+write) hits
system.cpu.dcache.demand_miss_latency 1551500 # number of demand (read+write) miss cycles
system.cpu.dcache.demand_miss_rate 0.078225 # miss rate for demand accesses
system.cpu.dcache.demand_misses 282 # number of demand (read+write) misses
system.cpu.dcache.demand_mshr_hits 130 # number of demand (read+write) MSHR hits
system.cpu.dcache.demand_mshr_miss_latency 724500 # number of demand (read+write) MSHR miss cycles
system.cpu.dcache.demand_mshr_miss_rate 0.042164 # mshr miss rate for demand accesses
system.cpu.dcache.demand_mshr_misses 152 # number of demand (read+write) MSHR misses
system.cpu.dcache.fast_writes 0 # number of fast writes performed
system.cpu.dcache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.dcache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.dcache.overall_accesses 4035 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 5471.830986 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 4756.578947 # average overall mshr miss latency
system.cpu.dcache.overall_accesses 3605 # number of overall (read+write) accesses
system.cpu.dcache.overall_avg_miss_latency 5501.773050 # average overall miss latency
system.cpu.dcache.overall_avg_mshr_miss_latency 4766.447368 # average overall mshr miss latency
system.cpu.dcache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.dcache.overall_hits 3751 # number of overall hits
system.cpu.dcache.overall_miss_latency 1554000 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.070384 # miss rate for overall accesses
system.cpu.dcache.overall_misses 284 # number of overall misses
system.cpu.dcache.overall_mshr_hits 132 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 723000 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.037670 # mshr miss rate for overall accesses
system.cpu.dcache.overall_hits 3323 # number of overall hits
system.cpu.dcache.overall_miss_latency 1551500 # number of overall miss cycles
system.cpu.dcache.overall_miss_rate 0.078225 # miss rate for overall accesses
system.cpu.dcache.overall_misses 282 # number of overall misses
system.cpu.dcache.overall_mshr_hits 130 # number of overall MSHR hits
system.cpu.dcache.overall_mshr_miss_latency 724500 # number of overall MSHR miss cycles
system.cpu.dcache.overall_mshr_miss_rate 0.042164 # mshr miss rate for overall accesses
system.cpu.dcache.overall_mshr_misses 152 # number of overall MSHR misses
system.cpu.dcache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.dcache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
@ -123,85 +123,85 @@ system.cpu.dcache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.dcache.replacements 0 # number of replacements
system.cpu.dcache.sampled_refs 152 # Sample count of references to valid blocks.
system.cpu.dcache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.dcache.tagsinuse 113.439038 # Cycle average of tags in use
system.cpu.dcache.total_refs 3757 # Total number of references to valid blocks.
system.cpu.dcache.tagsinuse 113.060803 # Cycle average of tags in use
system.cpu.dcache.total_refs 3329 # Total number of references to valid blocks.
system.cpu.dcache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.dcache.writebacks 0 # number of writebacks
system.cpu.decode.DECODE:BlockedCycles 4602 # Number of cycles decode is blocked
system.cpu.decode.DECODE:DecodedInsts 38937 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 16098 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 7883 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 3063 # Number of cycles decode is squashing
system.cpu.decode.DECODE:UnblockCycles 218 # Number of cycles decode is unblocking
system.cpu.fetch.Branches 7954 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 4933 # Number of cache lines fetched
system.cpu.fetch.Cycles 14166 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 565 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 44421 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 2121 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.249623 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 4933 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 2726 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.394081 # Number of inst fetches per cycle
system.cpu.decode.DECODE:BlockedCycles 3802 # Number of cycles decode is blocked
system.cpu.decode.DECODE:DecodedInsts 34098 # Number of instructions handled by decode
system.cpu.decode.DECODE:IdleCycles 15413 # Number of cycles decode is idle
system.cpu.decode.DECODE:RunCycles 9282 # Number of cycles decode is running
system.cpu.decode.DECODE:SquashCycles 2804 # Number of cycles decode is squashing
system.cpu.decode.DECODE:UnblockCycles 64 # Number of cycles decode is unblocking
system.cpu.fetch.Branches 6955 # Number of branches that fetch encountered
system.cpu.fetch.CacheLines 4655 # Number of cache lines fetched
system.cpu.fetch.Cycles 15062 # Number of cycles fetch has run and was not squashing or blocked
system.cpu.fetch.IcacheSquashes 489 # Number of outstanding Icache misses that were squashed
system.cpu.fetch.Insts 38520 # Number of instructions fetch has processed
system.cpu.fetch.SquashCycles 2061 # Number of cycles fetch has spent squashing
system.cpu.fetch.branchRate 0.221744 # Number of branch fetches per cycle
system.cpu.fetch.icacheStallCycles 4655 # Number of cycles fetch is stalled on an Icache miss
system.cpu.fetch.predictedBranches 2589 # Number of branches that fetch has predicted taken
system.cpu.fetch.rate 1.228121 # Number of inst fetches per cycle
system.cpu.fetch.rateDist.start_dist # Number of instructions fetched each cycle (Total)
system.cpu.fetch.rateDist.samples 31864
system.cpu.fetch.rateDist.samples 31365
system.cpu.fetch.rateDist.min_value 0
0 22632 7102.69%
1 2187 686.35%
2 562 176.37%
3 869 272.72%
4 521 163.51%
5 770 241.65%
6 886 278.06%
7 243 76.26%
8 3194 1002.39%
0 20959 6682.29%
1 4502 1435.36%
2 577 183.96%
3 682 217.44%
4 776 247.41%
5 629 200.54%
6 581 185.24%
7 189 60.26%
8 2470 787.50%
system.cpu.fetch.rateDist.max_value 8
system.cpu.fetch.rateDist.end_dist
system.cpu.icache.ReadReq_accesses 4933 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5310.666667 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4396.174863 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 4558 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 1991500 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.076019 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 375 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 9 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 1609000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.074194 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_accesses 4655 # number of ReadReq accesses(hits+misses)
system.cpu.icache.ReadReq_avg_miss_latency 5308.823529 # average ReadReq miss latency
system.cpu.icache.ReadReq_avg_mshr_miss_latency 4382.513661 # average ReadReq mshr miss latency
system.cpu.icache.ReadReq_hits 4281 # number of ReadReq hits
system.cpu.icache.ReadReq_miss_latency 1985500 # number of ReadReq miss cycles
system.cpu.icache.ReadReq_miss_rate 0.080344 # miss rate for ReadReq accesses
system.cpu.icache.ReadReq_misses 374 # number of ReadReq misses
system.cpu.icache.ReadReq_mshr_hits 8 # number of ReadReq MSHR hits
system.cpu.icache.ReadReq_mshr_miss_latency 1604000 # number of ReadReq MSHR miss cycles
system.cpu.icache.ReadReq_mshr_miss_rate 0.078625 # mshr miss rate for ReadReq accesses
system.cpu.icache.ReadReq_mshr_misses 366 # number of ReadReq MSHR misses
system.cpu.icache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_blocked_cycles_no_targets <err: div-0> # average number of cycles each access was blocked
system.cpu.icache.avg_refs 12.453552 # Average number of references to valid blocks.
system.cpu.icache.avg_refs 11.696721 # Average number of references to valid blocks.
system.cpu.icache.blocked_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_no_targets 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_mshrs 0 # number of cycles access was blocked
system.cpu.icache.blocked_cycles_no_targets 0 # number of cycles access was blocked
system.cpu.icache.cache_copies 0 # number of cache copies performed
system.cpu.icache.demand_accesses 4933 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5310.666667 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4396.174863 # average overall mshr miss latency
system.cpu.icache.demand_hits 4558 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 1991500 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.076019 # miss rate for demand accesses
system.cpu.icache.demand_misses 375 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 9 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 1609000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.074194 # mshr miss rate for demand accesses
system.cpu.icache.demand_accesses 4655 # number of demand (read+write) accesses
system.cpu.icache.demand_avg_miss_latency 5308.823529 # average overall miss latency
system.cpu.icache.demand_avg_mshr_miss_latency 4382.513661 # average overall mshr miss latency
system.cpu.icache.demand_hits 4281 # number of demand (read+write) hits
system.cpu.icache.demand_miss_latency 1985500 # number of demand (read+write) miss cycles
system.cpu.icache.demand_miss_rate 0.080344 # miss rate for demand accesses
system.cpu.icache.demand_misses 374 # number of demand (read+write) misses
system.cpu.icache.demand_mshr_hits 8 # number of demand (read+write) MSHR hits
system.cpu.icache.demand_mshr_miss_latency 1604000 # number of demand (read+write) MSHR miss cycles
system.cpu.icache.demand_mshr_miss_rate 0.078625 # mshr miss rate for demand accesses
system.cpu.icache.demand_mshr_misses 366 # number of demand (read+write) MSHR misses
system.cpu.icache.fast_writes 0 # number of fast writes performed
system.cpu.icache.mshr_cap_events 0 # number of times MSHR cap was activated
system.cpu.icache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.icache.overall_accesses 4933 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5310.666667 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4396.174863 # average overall mshr miss latency
system.cpu.icache.overall_accesses 4655 # number of overall (read+write) accesses
system.cpu.icache.overall_avg_miss_latency 5308.823529 # average overall miss latency
system.cpu.icache.overall_avg_mshr_miss_latency 4382.513661 # average overall mshr miss latency
system.cpu.icache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.icache.overall_hits 4558 # number of overall hits
system.cpu.icache.overall_miss_latency 1991500 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.076019 # miss rate for overall accesses
system.cpu.icache.overall_misses 375 # number of overall misses
system.cpu.icache.overall_mshr_hits 9 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 1609000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.074194 # mshr miss rate for overall accesses
system.cpu.icache.overall_hits 4281 # number of overall hits
system.cpu.icache.overall_miss_latency 1985500 # number of overall miss cycles
system.cpu.icache.overall_miss_rate 0.080344 # miss rate for overall accesses
system.cpu.icache.overall_misses 374 # number of overall misses
system.cpu.icache.overall_mshr_hits 8 # number of overall MSHR hits
system.cpu.icache.overall_mshr_miss_latency 1604000 # number of overall MSHR miss cycles
system.cpu.icache.overall_mshr_miss_rate 0.078625 # mshr miss rate for overall accesses
system.cpu.icache.overall_mshr_misses 366 # number of overall MSHR misses
system.cpu.icache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
system.cpu.icache.overall_mshr_uncacheable_misses 0 # number of overall MSHR uncacheable misses
@ -217,59 +217,59 @@ system.cpu.icache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.icache.replacements 1 # number of replacements
system.cpu.icache.sampled_refs 366 # Sample count of references to valid blocks.
system.cpu.icache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.icache.tagsinuse 233.760012 # Cycle average of tags in use
system.cpu.icache.total_refs 4558 # Total number of references to valid blocks.
system.cpu.icache.tagsinuse 232.692086 # Cycle average of tags in use
system.cpu.icache.total_refs 4281 # Total number of references to valid blocks.
system.cpu.icache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.icache.writebacks 0 # number of writebacks
system.cpu.idleCycles 499 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 3548 # Number of branches executed
system.cpu.idleCycles 1997 # Total number of cycles that the CPU has spent unscheduled due to idling
system.cpu.iew.EXEC:branches 3040 # Number of branches executed
system.cpu.iew.EXEC:nop 0 # number of nop insts executed
system.cpu.iew.EXEC:rate 0.670318 # Inst execution rate
system.cpu.iew.EXEC:refs 5385 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 2502 # Number of stores executed
system.cpu.iew.EXEC:rate 0.582082 # Inst execution rate
system.cpu.iew.EXEC:refs 4490 # number of memory reference insts executed
system.cpu.iew.EXEC:stores 2077 # Number of stores executed
system.cpu.iew.EXEC:swp 0 # number of swp insts executed
system.cpu.iew.WB:consumers 10159 # num instructions consuming a value
system.cpu.iew.WB:count 20199 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 0.790629 # average fanout of values written-back
system.cpu.iew.WB:consumers 8997 # num instructions consuming a value
system.cpu.iew.WB:count 17565 # cumulative count of insts written-back
system.cpu.iew.WB:fanout 0.831833 # average fanout of values written-back
system.cpu.iew.WB:penalized 0 # number of instrctions required to write to 'other' IQ
system.cpu.iew.WB:penalized_rate 0 # fraction of instructions written-back that wrote to 'other' IQ
system.cpu.iew.WB:producers 8032 # num instructions producing a value
system.cpu.iew.WB:rate 0.633913 # insts written-back per cycle
system.cpu.iew.WB:sent 20448 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 2568 # Number of branch mispredicts detected at execute
system.cpu.iew.WB:producers 7484 # num instructions producing a value
system.cpu.iew.WB:rate 0.560019 # insts written-back per cycle
system.cpu.iew.WB:sent 17724 # cumulative count of insts sent to commit
system.cpu.iew.branchMispredicts 2199 # Number of branch mispredicts detected at execute
system.cpu.iew.iewBlockCycles 0 # Number of cycles IEW is blocking
system.cpu.iew.iewDispLoadInsts 3198 # Number of dispatched load instructions
system.cpu.iew.iewDispNonSpecInsts 610 # Number of dispatched non-speculative instructions
system.cpu.iew.iewDispSquashedInsts 2750 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 2970 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 25274 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 2883 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 1463 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 21359 # Number of executed instructions
system.cpu.iew.iewDispLoadInsts 2999 # Number of dispatched load instructions
system.cpu.iew.iewDispNonSpecInsts 609 # Number of dispatched non-speculative instructions
system.cpu.iew.iewDispSquashedInsts 1287 # Number of squashed instructions skipped by dispatch
system.cpu.iew.iewDispStoreInsts 2872 # Number of dispatched store instructions
system.cpu.iew.iewDispatchedInsts 23636 # Number of instructions dispatched to IQ
system.cpu.iew.iewExecLoadInsts 2413 # Number of load instructions executed
system.cpu.iew.iewExecSquashedInsts 3118 # Number of squashed instructions skipped in execute
system.cpu.iew.iewExecutedInsts 18257 # Number of executed instructions
system.cpu.iew.iewIQFullEvents 0 # Number of times the IQ has become full, causing a stall
system.cpu.iew.iewIdleCycles 0 # Number of cycles IEW is idle
system.cpu.iew.iewLSQFullEvents 0 # Number of times the LSQ has become full, causing a stall
system.cpu.iew.iewSquashCycles 3063 # Number of cycles IEW is squashing
system.cpu.iew.iewSquashCycles 2804 # Number of cycles IEW is squashing
system.cpu.iew.iewUnblockCycles 0 # Number of cycles IEW is unblocking
system.cpu.iew.lsq.thread.0.blockedLoads 0 # Number of blocked loads due to partial load-store forwarding
system.cpu.iew.lsq.thread.0.cacheBlocked 0 # Number of times an access to memory failed due to the cache being blocked
system.cpu.iew.lsq.thread.0.forwLoads 48 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.0.forwLoads 43 # Number of loads that had data forwarded from stores
system.cpu.iew.lsq.thread.0.ignoredResponses 8 # Number of memory responses ignored because the instruction is squashed
system.cpu.iew.lsq.thread.0.invAddrLoads 0 # Number of loads ignored due to an invalid address
system.cpu.iew.lsq.thread.0.invAddrSwpfs 0 # Number of software prefetches ignored due to an invalid address
system.cpu.iew.lsq.thread.0.memOrderViolation 52 # Number of memory ordering violations
system.cpu.iew.lsq.thread.0.rescheduledLoads 0 # Number of loads that were rescheduled
system.cpu.iew.lsq.thread.0.squashedLoads 1736 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 1672 # Number of stores squashed
system.cpu.iew.lsq.thread.0.squashedLoads 1537 # Number of loads squashed
system.cpu.iew.lsq.thread.0.squashedStores 1574 # Number of stores squashed
system.cpu.iew.memOrderViolationEvents 52 # Number of memory order violations
system.cpu.iew.predictedNotTakenIncorrect 958 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 1610 # Number of branches that were predicted taken incorrectly
system.cpu.ipc 0.344464 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.344464 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 22822 # Type of FU issued
system.cpu.iew.predictedNotTakenIncorrect 682 # Number of branches that were predicted not taken incorrectly
system.cpu.iew.predictedTakenIncorrect 1517 # Number of branches that were predicted taken incorrectly
system.cpu.ipc 0.349944 # IPC: Instructions Per Cycle
system.cpu.ipc_total 0.349944 # IPC: Total IPC of All Threads
system.cpu.iq.ISSUE:FU_type_0 21375 # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.start_dist
(null) 1826 8.00% # Type of FU issued
IntAlu 15247 66.81% # Type of FU issued
No_OpClass 1750 8.19% # Type of FU issued
IntAlu 14209 66.47% # Type of FU issued
IntMult 0 0.00% # Type of FU issued
IntDiv 0 0.00% # Type of FU issued
FloatAdd 0 0.00% # Type of FU issued
@ -278,16 +278,16 @@ system.cpu.iq.ISSUE:FU_type_0.start_dist
FloatMult 0 0.00% # Type of FU issued
FloatDiv 0 0.00% # Type of FU issued
FloatSqrt 0 0.00% # Type of FU issued
MemRead 3042 13.33% # Type of FU issued
MemWrite 2707 11.86% # Type of FU issued
MemRead 2832 13.25% # Type of FU issued
MemWrite 2584 12.09% # Type of FU issued
IprAccess 0 0.00% # Type of FU issued
InstPrefetch 0 0.00% # Type of FU issued
system.cpu.iq.ISSUE:FU_type_0.end_dist
system.cpu.iq.ISSUE:fu_busy_cnt 190 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.008325 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_busy_cnt 160 # FU busy when requested
system.cpu.iq.ISSUE:fu_busy_rate 0.007485 # FU busy rate (busy events/executed inst)
system.cpu.iq.ISSUE:fu_full.start_dist
(null) 0 0.00% # attempts to use FU when none available
IntAlu 50 26.32% # attempts to use FU when none available
No_OpClass 0 0.00% # attempts to use FU when none available
IntAlu 27 16.88% # attempts to use FU when none available
IntMult 0 0.00% # attempts to use FU when none available
IntDiv 0 0.00% # attempts to use FU when none available
FloatAdd 0 0.00% # attempts to use FU when none available
@ -296,41 +296,41 @@ system.cpu.iq.ISSUE:fu_full.start_dist
FloatMult 0 0.00% # attempts to use FU when none available
FloatDiv 0 0.00% # attempts to use FU when none available
FloatSqrt 0 0.00% # attempts to use FU when none available
MemRead 25 13.16% # attempts to use FU when none available
MemWrite 115 60.53% # attempts to use FU when none available
MemRead 23 14.37% # attempts to use FU when none available
MemWrite 110 68.75% # attempts to use FU when none available
IprAccess 0 0.00% # attempts to use FU when none available
InstPrefetch 0 0.00% # attempts to use FU when none available
system.cpu.iq.ISSUE:fu_full.end_dist
system.cpu.iq.ISSUE:issued_per_cycle.start_dist # Number of insts issued each cycle
system.cpu.iq.ISSUE:issued_per_cycle.samples 31864
system.cpu.iq.ISSUE:issued_per_cycle.samples 31365
system.cpu.iq.ISSUE:issued_per_cycle.min_value 0
0 22879 7180.20%
1 3824 1200.10%
2 1304 409.24%
3 1251 392.61%
4 1252 392.92%
5 751 235.69%
6 414 129.93%
7 122 38.29%
8 67 21.03%
0 21827 6959.03%
1 4212 1342.90%
2 2084 664.43%
3 1568 499.92%
4 766 244.22%
5 454 144.75%
6 283 90.23%
7 109 34.75%
8 62 19.77%
system.cpu.iq.ISSUE:issued_per_cycle.max_value 8
system.cpu.iq.ISSUE:issued_per_cycle.end_dist
system.cpu.iq.ISSUE:rate 0.716231 # Inst issue rate
system.cpu.iq.iqInstsAdded 24664 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 22822 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 610 # Number of non-speculative instructions added to the IQ
system.cpu.iq.iqSquashedInstsExamined 11119 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 83 # Number of squashed instructions issued
system.cpu.iq.iqSquashedNonSpecRemoved 283 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 5685 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.iq.ISSUE:rate 0.681492 # Inst issue rate
system.cpu.iq.iqInstsAdded 23027 # Number of instructions added to the IQ (excludes non-spec)
system.cpu.iq.iqInstsIssued 21375 # Number of instructions issued
system.cpu.iq.iqNonSpecInstsAdded 609 # Number of non-speculative instructions added to the IQ
system.cpu.iq.iqSquashedInstsExamined 10843 # Number of squashed instructions iterated over during squash; mainly for profiling
system.cpu.iq.iqSquashedInstsIssued 99 # Number of squashed instructions issued
system.cpu.iq.iqSquashedNonSpecRemoved 280 # Number of squashed non-spec instructions that were removed
system.cpu.iq.iqSquashedOperandsExamined 7823 # Number of squashed operands that are examined and possibly removed from graph
system.cpu.l2cache.ReadReq_accesses 514 # number of ReadReq accesses(hits+misses)
system.cpu.l2cache.ReadReq_avg_miss_latency 4458.171206 # average ReadReq miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2373.540856 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_avg_mshr_miss_latency 2375.486381 # average ReadReq mshr miss latency
system.cpu.l2cache.ReadReq_miss_latency 2291500 # number of ReadReq miss cycles
system.cpu.l2cache.ReadReq_miss_rate 1 # miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_misses 514 # number of ReadReq misses
system.cpu.l2cache.ReadReq_mshr_miss_latency 1220000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_latency 1221000 # number of ReadReq MSHR miss cycles
system.cpu.l2cache.ReadReq_mshr_miss_rate 1 # mshr miss rate for ReadReq accesses
system.cpu.l2cache.ReadReq_mshr_misses 514 # number of ReadReq MSHR misses
system.cpu.l2cache.avg_blocked_cycles_no_mshrs <err: div-0> # average number of cycles each access was blocked
@ -343,13 +343,13 @@ system.cpu.l2cache.blocked_cycles_no_targets 0
system.cpu.l2cache.cache_copies 0 # number of cache copies performed
system.cpu.l2cache.demand_accesses 514 # number of demand (read+write) accesses
system.cpu.l2cache.demand_avg_miss_latency 4458.171206 # average overall miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2373.540856 # average overall mshr miss latency
system.cpu.l2cache.demand_avg_mshr_miss_latency 2375.486381 # average overall mshr miss latency
system.cpu.l2cache.demand_hits 0 # number of demand (read+write) hits
system.cpu.l2cache.demand_miss_latency 2291500 # number of demand (read+write) miss cycles
system.cpu.l2cache.demand_miss_rate 1 # miss rate for demand accesses
system.cpu.l2cache.demand_misses 514 # number of demand (read+write) misses
system.cpu.l2cache.demand_mshr_hits 0 # number of demand (read+write) MSHR hits
system.cpu.l2cache.demand_mshr_miss_latency 1220000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_latency 1221000 # number of demand (read+write) MSHR miss cycles
system.cpu.l2cache.demand_mshr_miss_rate 1 # mshr miss rate for demand accesses
system.cpu.l2cache.demand_mshr_misses 514 # number of demand (read+write) MSHR misses
system.cpu.l2cache.fast_writes 0 # number of fast writes performed
@ -357,14 +357,14 @@ system.cpu.l2cache.mshr_cap_events 0 # nu
system.cpu.l2cache.no_allocate_misses 0 # Number of misses that were no-allocate
system.cpu.l2cache.overall_accesses 514 # number of overall (read+write) accesses
system.cpu.l2cache.overall_avg_miss_latency 4458.171206 # average overall miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2373.540856 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_miss_latency 2375.486381 # average overall mshr miss latency
system.cpu.l2cache.overall_avg_mshr_uncacheable_latency <err: div-0> # average overall mshr uncacheable latency
system.cpu.l2cache.overall_hits 0 # number of overall hits
system.cpu.l2cache.overall_miss_latency 2291500 # number of overall miss cycles
system.cpu.l2cache.overall_miss_rate 1 # miss rate for overall accesses
system.cpu.l2cache.overall_misses 514 # number of overall misses
system.cpu.l2cache.overall_mshr_hits 0 # number of overall MSHR hits
system.cpu.l2cache.overall_mshr_miss_latency 1220000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_latency 1221000 # number of overall MSHR miss cycles
system.cpu.l2cache.overall_mshr_miss_rate 1 # mshr miss rate for overall accesses
system.cpu.l2cache.overall_mshr_misses 514 # number of overall MSHR misses
system.cpu.l2cache.overall_mshr_uncacheable_latency 0 # number of overall MSHR uncacheable cycles
@ -381,26 +381,25 @@ system.cpu.l2cache.prefetcher.num_hwpf_squashed_from_miss 0
system.cpu.l2cache.replacements 0 # number of replacements
system.cpu.l2cache.sampled_refs 514 # Sample count of references to valid blocks.
system.cpu.l2cache.soft_prefetch_mshr_full 0 # number of mshr full events for SW prefetching instrutions
system.cpu.l2cache.tagsinuse 345.564898 # Cycle average of tags in use
system.cpu.l2cache.tagsinuse 344.125692 # Cycle average of tags in use
system.cpu.l2cache.total_refs 0 # Total number of references to valid blocks.
system.cpu.l2cache.warmup_cycle 0 # Cycle when the warmup percentage was hit.
system.cpu.l2cache.writebacks 0 # number of writebacks
system.cpu.numCycles 31864 # number of cpu cycles simulated
system.cpu.numCycles 31365 # number of cpu cycles simulated
system.cpu.rename.RENAME:CommittedMaps 9868 # Number of HB maps that are committed
system.cpu.rename.RENAME:IdleCycles 16082 # Number of cycles rename is idle
system.cpu.rename.RENAME:RenameLookups 44650 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 29655 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 24195 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 7618 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 3063 # Number of cycles rename is squashing
system.cpu.rename.RENAME:SquashedInsts 8815 # Number of squashed instructions processed by rename
system.cpu.rename.RENAME:UnblockCycles 684 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 14327 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 3915 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:serializingInsts 631 # count of serializing insts renamed
system.cpu.rename.RENAME:skidInsts 4702 # count of insts added to the skid buffer
system.cpu.rename.RENAME:tempSerializingInsts 623 # count of temporary serializing insts renamed
system.cpu.timesIdled 1 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.rename.RENAME:IdleCycles 16585 # Number of cycles rename is idle
system.cpu.rename.RENAME:RenameLookups 46161 # Number of register rename lookups that rename has made
system.cpu.rename.RENAME:RenamedInsts 26550 # Number of instructions processed by rename
system.cpu.rename.RENAME:RenamedOperands 21893 # Number of destination operands rename has renamed
system.cpu.rename.RENAME:RunCycles 8196 # Number of cycles rename is running
system.cpu.rename.RENAME:SquashCycles 2804 # Number of cycles rename is squashing
system.cpu.rename.RENAME:UnblockCycles 229 # Number of cycles rename is unblocking
system.cpu.rename.RENAME:UndoneMaps 12025 # Number of HB maps that are undone due to squashing
system.cpu.rename.RENAME:serializeStallCycles 3551 # count of cycles rename stalled for serializing inst
system.cpu.rename.RENAME:serializingInsts 628 # count of serializing insts renamed
system.cpu.rename.RENAME:skidInsts 4297 # count of insts added to the skid buffer
system.cpu.rename.RENAME:tempSerializingInsts 640 # count of temporary serializing insts renamed
system.cpu.timesIdled 3 # Number of times that the entire CPU went into an idle state and unscheduled itself
system.cpu.workload.PROG:num_syscalls 8 # Number of system calls
---------- End Simulation Statistics ----------

View file

@ -16,9 +16,9 @@ The Regents of The University of Michigan
All Rights Reserved
M5 compiled May 15 2007 13:02:31
M5 started Tue May 15 17:00:06 2007
M5 compiled Jun 21 2007 21:15:48
M5 started Fri Jun 22 00:32:08 2007
M5 executing on zizzer.eecs.umich.edu
command line: build/SPARC_SE/m5.fast -d build/SPARC_SE/tests/fast/quick/02.insttest/sparc/linux/o3-timing tests/run.py quick/02.insttest/sparc/linux/o3-timing
Global frequency set at 1000000000000 ticks per second
Exiting @ tick 15931500 because target called exit()
Exiting @ tick 15682500 because target called exit()