61d95de4c8
SConscript: arch/isa_parser.py: cpu/base_dyn_inst.cc: Remove OOO CPU stuff. arch/alpha/faults.hh: Add fake memory fault. This will be removed eventually. arch/alpha/isa_desc: Change EA comp and Mem accessor to be const StaticInstPtrs. cpu/base_dyn_inst.hh: Update read/write calls to use load queue and store queue indices. cpu/beta_cpu/alpha_dyn_inst.hh: Change to const StaticInst in the register accessors. cpu/beta_cpu/alpha_dyn_inst_impl.hh: Update syscall code with thread numbers. cpu/beta_cpu/alpha_full_cpu.hh: Alter some of the full system code so it will compile without errors. cpu/beta_cpu/alpha_full_cpu_builder.cc: Created a DerivAlphaFullCPU class so I can instantiate different CPUs that have different template parameters. cpu/beta_cpu/alpha_full_cpu_impl.hh: Update some of the full system code so it compiles. cpu/beta_cpu/alpha_params.hh: cpu/beta_cpu/fetch_impl.hh: Remove asid. cpu/beta_cpu/comm.hh: Remove global history field. cpu/beta_cpu/commit.hh: Comment out rename map. cpu/beta_cpu/commit_impl.hh: Update some of the full system code so it compiles. Also change it so that it handles memory instructions properly. cpu/beta_cpu/cpu_policy.hh: Removed IQ from the IEW template parameter to make it more uniform. cpu/beta_cpu/decode.hh: Add debug function. cpu/beta_cpu/decode_impl.hh: Slight updates for decode in the case where it causes a squash. cpu/beta_cpu/fetch.hh: cpu/beta_cpu/rob.hh: Comment out unneccessary code. cpu/beta_cpu/full_cpu.cc: Changed some of the full system code so it compiles. Updated exec contexts and so forth to hopefully make multithreading easier. cpu/beta_cpu/full_cpu.hh: Updated some of the full system code to make it compile. cpu/beta_cpu/iew.cc: Removed IQ from template parameter to IEW. cpu/beta_cpu/iew.hh: Removed IQ from template parameter to IEW. Updated IEW to recognize the Load/Store queue. cpu/beta_cpu/iew_impl.hh: New handling of memory instructions through the Load/Store queue. cpu/beta_cpu/inst_queue.hh: Updated comment. cpu/beta_cpu/inst_queue_impl.hh: Slightly different handling of memory instructions due to Load/Store queue. cpu/beta_cpu/regfile.hh: Updated full system code so it compiles. cpu/beta_cpu/rob_impl.hh: Moved some code around; no major functional changes. cpu/ooo_cpu/ooo_cpu.hh: Slight updates to OOO CPU; still does not work. cpu/static_inst.hh: Remove OOO CPU stuff. Change ea comp and mem acc to return const StaticInst. kern/kernel_stats.hh: Extra forward declares added due to compile error. --HG-- extra : convert_revision : 594a7cdbe57f6c2bda7d08856fcd864604a6238e
308 lines
9.6 KiB
C++
308 lines
9.6 KiB
C++
#ifndef __INST_QUEUE_HH__
|
|
#define __INST_QUEUE_HH__
|
|
|
|
#include <list>
|
|
#include <map>
|
|
#include <queue>
|
|
#include <stdint.h>
|
|
#include <vector>
|
|
|
|
#include "base/statistics.hh"
|
|
#include "base/timebuf.hh"
|
|
#include "cpu/inst_seq.hh"
|
|
|
|
/**
|
|
* A standard instruction queue class. It holds instructions in an
|
|
* array, holds the ordering of the instructions within a linked list,
|
|
* and tracks producer/consumer dependencies within a separate linked
|
|
* list. Similar to the rename map and the free list, it expects that
|
|
* floating point registers have their indices start after the integer
|
|
* registers (ie with 96 int and 96 fp registers, regs 0-95 are integer
|
|
* and 96-191 are fp). This remains true even for both logical and
|
|
* physical register indices.
|
|
*/
|
|
template <class Impl>
|
|
class InstructionQueue
|
|
{
|
|
public:
|
|
//Typedefs from the Impl.
|
|
typedef typename Impl::FullCPU FullCPU;
|
|
typedef typename Impl::DynInstPtr DynInstPtr;
|
|
typedef typename Impl::Params Params;
|
|
|
|
typedef typename Impl::CPUPol::MemDepUnit MemDepUnit;
|
|
typedef typename Impl::CPUPol::IssueStruct IssueStruct;
|
|
typedef typename Impl::CPUPol::TimeStruct TimeStruct;
|
|
|
|
// Typedef of iterator through the list of instructions. Might be
|
|
// better to untie this from the FullCPU or pass its information to
|
|
// the stages.
|
|
typedef typename std::list<DynInstPtr>::iterator ListIt;
|
|
|
|
/**
|
|
* Struct for comparing entries to be added to the priority queue. This
|
|
* gives reverse ordering to the instructions in terms of sequence
|
|
* numbers: the instructions with smaller sequence numbers (and hence
|
|
* are older) will be at the top of the priority queue.
|
|
*/
|
|
struct pqCompare
|
|
{
|
|
bool operator() (const DynInstPtr &lhs, const DynInstPtr &rhs) const
|
|
{
|
|
return lhs->seqNum > rhs->seqNum;
|
|
}
|
|
};
|
|
|
|
/**
|
|
* Struct for comparing entries to be added to the set. This gives
|
|
* standard ordering in terms of sequence numbers.
|
|
*/
|
|
struct setCompare
|
|
{
|
|
bool operator() (const DynInstPtr &lhs, const DynInstPtr &rhs) const
|
|
{
|
|
return lhs->seqNum < rhs->seqNum;
|
|
}
|
|
};
|
|
|
|
typedef std::priority_queue<DynInstPtr, vector<DynInstPtr>, pqCompare>
|
|
ReadyInstQueue;
|
|
|
|
InstructionQueue(Params ¶ms);
|
|
|
|
void regStats();
|
|
|
|
void setCPU(FullCPU *cpu);
|
|
|
|
void setIssueToExecuteQueue(TimeBuffer<IssueStruct> *i2eQueue);
|
|
|
|
void setTimeBuffer(TimeBuffer<TimeStruct> *tb_ptr);
|
|
|
|
unsigned numFreeEntries();
|
|
|
|
bool isFull();
|
|
|
|
void insert(DynInstPtr &new_inst);
|
|
|
|
void insertNonSpec(DynInstPtr &new_inst);
|
|
|
|
void advanceTail(DynInstPtr &inst);
|
|
|
|
void scheduleReadyInsts();
|
|
|
|
void scheduleNonSpec(const InstSeqNum &inst);
|
|
|
|
void wakeDependents(DynInstPtr &completed_inst);
|
|
|
|
void violation(DynInstPtr &store, DynInstPtr &faulting_load);
|
|
|
|
// Change this to take in the sequence number
|
|
void squash();
|
|
|
|
void doSquash();
|
|
|
|
void stopSquash();
|
|
|
|
/** Debugging function to dump all the list sizes, as well as print
|
|
* out the list of nonspeculative instructions. Should not be used
|
|
* in any other capacity, but it has no harmful sideaffects.
|
|
*/
|
|
void dumpLists();
|
|
|
|
private:
|
|
/** Debugging function to count how many entries are in the IQ. It does
|
|
* a linear walk through the instructions, so do not call this function
|
|
* during normal execution.
|
|
*/
|
|
int countInsts();
|
|
|
|
private:
|
|
/** Pointer to the CPU. */
|
|
FullCPU *cpu;
|
|
|
|
/** The memory dependence unit, which tracks/predicts memory dependences
|
|
* between instructions.
|
|
*/
|
|
MemDepUnit memDepUnit;
|
|
|
|
/** The queue to the execute stage. Issued instructions will be written
|
|
* into it.
|
|
*/
|
|
TimeBuffer<IssueStruct> *issueToExecuteQueue;
|
|
|
|
/** The backwards time buffer. */
|
|
TimeBuffer<TimeStruct> *timeBuffer;
|
|
|
|
/** Wire to read information from timebuffer. */
|
|
typename TimeBuffer<TimeStruct>::wire fromCommit;
|
|
|
|
enum InstList {
|
|
Int,
|
|
Float,
|
|
Branch,
|
|
Memory,
|
|
Misc,
|
|
Squashed,
|
|
None
|
|
};
|
|
|
|
/** List of ready int instructions. Used to keep track of the order in
|
|
* which instructions should issue.
|
|
*/
|
|
ReadyInstQueue readyIntInsts;
|
|
|
|
/** List of ready floating point instructions. */
|
|
ReadyInstQueue readyFloatInsts;
|
|
|
|
/** List of ready branch instructions. */
|
|
ReadyInstQueue readyBranchInsts;
|
|
|
|
/** List of ready memory instructions. */
|
|
// ReadyInstQueue readyMemInsts;
|
|
|
|
/** List of ready miscellaneous instructions. */
|
|
ReadyInstQueue readyMiscInsts;
|
|
|
|
/** List of squashed instructions (which are still valid and in IQ).
|
|
* Implemented using a priority queue; the entries must contain both
|
|
* the IQ index and sequence number of each instruction so that
|
|
* ordering based on sequence numbers can be used.
|
|
*/
|
|
ReadyInstQueue squashedInsts;
|
|
|
|
/** List of non-speculative instructions that will be scheduled
|
|
* once the IQ gets a signal from commit. While it's redundant to
|
|
* have the key be a part of the value (the sequence number is stored
|
|
* inside of DynInst), when these instructions are woken up only
|
|
* the sequence number will be available. Thus it is most efficient to be
|
|
* able to search by the sequence number alone.
|
|
*/
|
|
std::map<InstSeqNum, DynInstPtr> nonSpecInsts;
|
|
|
|
typedef typename std::map<InstSeqNum, DynInstPtr>::iterator non_spec_it_t;
|
|
|
|
/** Number of free IQ entries left. */
|
|
unsigned freeEntries;
|
|
|
|
/** The number of entries in the instruction queue. */
|
|
unsigned numEntries;
|
|
|
|
/** The number of integer instructions that can be issued in one
|
|
* cycle.
|
|
*/
|
|
unsigned intWidth;
|
|
|
|
/** The number of floating point instructions that can be issued
|
|
* in one cycle.
|
|
*/
|
|
unsigned floatWidth;
|
|
|
|
/** The number of branches that can be issued in one cycle. */
|
|
unsigned branchWidth;
|
|
|
|
/** The number of memory instructions that can be issued in one cycle. */
|
|
unsigned memoryWidth;
|
|
|
|
/** The total number of instructions that can be issued in one cycle. */
|
|
unsigned totalWidth;
|
|
|
|
//The number of physical registers in the CPU.
|
|
unsigned numPhysRegs;
|
|
|
|
/** The number of physical integer registers in the CPU. */
|
|
unsigned numPhysIntRegs;
|
|
|
|
/** The number of floating point registers in the CPU. */
|
|
unsigned numPhysFloatRegs;
|
|
|
|
/** Delay between commit stage and the IQ.
|
|
* @todo: Make there be a distinction between the delays within IEW.
|
|
*/
|
|
unsigned commitToIEWDelay;
|
|
|
|
//////////////////////////////////
|
|
// Variables needed for squashing
|
|
//////////////////////////////////
|
|
|
|
/** The sequence number of the squashed instruction. */
|
|
InstSeqNum squashedSeqNum;
|
|
|
|
/** Iterator that points to the youngest instruction in the IQ. */
|
|
ListIt tail;
|
|
|
|
/** Iterator that points to the last instruction that has been squashed.
|
|
* This will not be valid unless the IQ is in the process of squashing.
|
|
*/
|
|
ListIt squashIt;
|
|
|
|
///////////////////////////////////
|
|
// Dependency graph stuff
|
|
///////////////////////////////////
|
|
|
|
class DependencyEntry
|
|
{
|
|
public:
|
|
DynInstPtr inst;
|
|
//Might want to include data about what arch. register the
|
|
//dependence is waiting on.
|
|
DependencyEntry *next;
|
|
|
|
//This function, and perhaps this whole class, stand out a little
|
|
//bit as they don't fit a classification well. I want access
|
|
//to the underlying structure of the linked list, yet at
|
|
//the same time it feels like this should be something abstracted
|
|
//away. So for now it will sit here, within the IQ, until
|
|
//a better implementation is decided upon.
|
|
// This function probably shouldn't be within the entry...
|
|
void insert(DynInstPtr &new_inst);
|
|
|
|
void remove(DynInstPtr &inst_to_remove);
|
|
|
|
// Debug variable, remove when done testing.
|
|
static unsigned mem_alloc_counter;
|
|
};
|
|
|
|
/** Array of linked lists. Each linked list is a list of all the
|
|
* instructions that depend upon a given register. The actual
|
|
* register's index is used to index into the graph; ie all
|
|
* instructions in flight that are dependent upon r34 will be
|
|
* in the linked list of dependGraph[34].
|
|
*/
|
|
DependencyEntry *dependGraph;
|
|
|
|
/** A cache of the recently woken registers. It is 1 if the register
|
|
* has been woken up recently, and 0 if the register has been added
|
|
* to the dependency graph and has not yet received its value. It
|
|
* is basically a secondary scoreboard, and should pretty much mirror
|
|
* the scoreboard that exists in the rename map.
|
|
*/
|
|
vector<bool> regScoreboard;
|
|
|
|
bool addToDependents(DynInstPtr &new_inst);
|
|
void insertDependency(DynInstPtr &new_inst);
|
|
void createDependency(DynInstPtr &new_inst);
|
|
void dumpDependGraph();
|
|
|
|
void addIfReady(DynInstPtr &inst);
|
|
|
|
Stats::Scalar<> iqInstsAdded;
|
|
Stats::Scalar<> iqNonSpecInstsAdded;
|
|
// Stats::Scalar<> iqIntInstsAdded;
|
|
Stats::Scalar<> iqIntInstsIssued;
|
|
// Stats::Scalar<> iqFloatInstsAdded;
|
|
Stats::Scalar<> iqFloatInstsIssued;
|
|
// Stats::Scalar<> iqBranchInstsAdded;
|
|
Stats::Scalar<> iqBranchInstsIssued;
|
|
// Stats::Scalar<> iqMemInstsAdded;
|
|
Stats::Scalar<> iqMemInstsIssued;
|
|
// Stats::Scalar<> iqMiscInstsAdded;
|
|
Stats::Scalar<> iqMiscInstsIssued;
|
|
Stats::Scalar<> iqSquashedInstsIssued;
|
|
Stats::Scalar<> iqLoopSquashStalls;
|
|
Stats::Scalar<> iqSquashedInstsExamined;
|
|
Stats::Scalar<> iqSquashedOperandsExamined;
|
|
Stats::Scalar<> iqSquashedNonSpecRemoved;
|
|
|
|
};
|
|
|
|
#endif //__INST_QUEUE_HH__
|