984c2a4ff6
into zamp.eecs.umich.edu:/z/ktlim2/clean/newmem-merge src/cpu/checker/o3_cpu_builder.cc: src/cpu/o3/alpha_cpu.hh: src/cpu/o3/alpha_cpu_impl.hh: src/cpu/o3/alpha_dyn_inst_impl.hh: src/cpu/o3/bpred_unit.cc: src/cpu/o3/commit.hh: src/cpu/o3/fetch_impl.hh: src/cpu/o3/lsq_unit.hh: src/cpu/o3/lsq_unit_impl.hh: src/cpu/o3/thread_state.hh: Hand merge. --HG-- rename : cpu/activity.cc => src/cpu/activity.cc rename : cpu/activity.hh => src/cpu/activity.hh rename : cpu/base_dyn_inst.cc => src/cpu/base_dyn_inst.cc rename : cpu/checker/cpu.hh => src/cpu/checker/cpu.hh rename : cpu/checker/cpu_builder.cc => src/cpu/checker/cpu_builder.cc rename : cpu/checker/exec_context.hh => src/cpu/checker/exec_context.hh rename : cpu/checker/o3_cpu_builder.cc => src/cpu/checker/o3_cpu_builder.cc rename : cpu/o3/2bit_local_pred.cc => src/cpu/o3/2bit_local_pred.cc rename : cpu/o3/2bit_local_pred.hh => src/cpu/o3/2bit_local_pred.hh rename : cpu/o3/alpha_cpu.hh => src/cpu/o3/alpha_cpu.hh rename : cpu/o3/alpha_cpu_builder.cc => src/cpu/o3/alpha_cpu_builder.cc rename : cpu/o3/alpha_cpu_impl.hh => src/cpu/o3/alpha_cpu_impl.hh rename : cpu/o3/alpha_dyn_inst.hh => src/cpu/o3/alpha_dyn_inst.hh rename : cpu/o3/alpha_dyn_inst_impl.hh => src/cpu/o3/alpha_dyn_inst_impl.hh rename : cpu/o3/alpha_params.hh => src/cpu/o3/alpha_params.hh rename : cpu/o3/bpred_unit.cc => src/cpu/o3/bpred_unit.cc rename : cpu/o3/bpred_unit.hh => src/cpu/o3/bpred_unit.hh rename : cpu/o3/bpred_unit_impl.hh => src/cpu/o3/bpred_unit_impl.hh rename : cpu/o3/comm.hh => src/cpu/o3/comm.hh rename : cpu/o3/commit.hh => src/cpu/o3/commit.hh rename : cpu/o3/commit_impl.hh => src/cpu/o3/commit_impl.hh rename : cpu/o3/cpu.hh => src/cpu/o3/cpu.hh rename : cpu/o3/cpu_policy.hh => src/cpu/o3/cpu_policy.hh rename : cpu/o3/decode.hh => src/cpu/o3/decode.hh rename : cpu/o3/decode_impl.hh => src/cpu/o3/decode_impl.hh rename : cpu/o3/dep_graph.hh => src/cpu/o3/dep_graph.hh rename : cpu/o3/fetch.hh => src/cpu/o3/fetch.hh rename : cpu/o3/fetch_impl.hh => src/cpu/o3/fetch_impl.hh rename : cpu/o3/fu_pool.cc => src/cpu/o3/fu_pool.cc rename : cpu/o3/fu_pool.hh => src/cpu/o3/fu_pool.hh rename : cpu/o3/iew.hh => src/cpu/o3/iew.hh rename : cpu/o3/iew_impl.hh => src/cpu/o3/iew_impl.hh rename : cpu/o3/inst_queue.hh => src/cpu/o3/inst_queue.hh rename : cpu/o3/inst_queue_impl.hh => src/cpu/o3/inst_queue_impl.hh rename : cpu/o3/lsq.hh => src/cpu/o3/lsq.hh rename : cpu/o3/lsq_unit.hh => src/cpu/o3/lsq_unit.hh rename : cpu/o3/lsq_unit_impl.hh => src/cpu/o3/lsq_unit_impl.hh rename : cpu/o3/mem_dep_unit.hh => src/cpu/o3/mem_dep_unit.hh rename : cpu/o3/mem_dep_unit_impl.hh => src/cpu/o3/mem_dep_unit_impl.hh rename : cpu/o3/rename.hh => src/cpu/o3/rename.hh rename : cpu/o3/rename_impl.hh => src/cpu/o3/rename_impl.hh rename : cpu/o3/rename_map.hh => src/cpu/o3/rename_map.hh rename : cpu/o3/rob.hh => src/cpu/o3/rob.hh rename : cpu/o3/store_set.cc => src/cpu/o3/store_set.cc rename : cpu/o3/store_set.hh => src/cpu/o3/store_set.hh rename : cpu/o3/thread_state.hh => src/cpu/o3/thread_state.hh rename : cpu/o3/tournament_pred.cc => src/cpu/o3/tournament_pred.cc rename : cpu/o3/tournament_pred.hh => src/cpu/o3/tournament_pred.hh rename : cpu/ozone/cpu_builder.cc => src/cpu/ozone/cpu_builder.cc rename : cpu/ozone/ozone_impl.hh => src/cpu/ozone/ozone_impl.hh rename : cpu/ozone/simple_impl.hh => src/cpu/ozone/simple_impl.hh rename : cpu/ozone/simple_params.hh => src/cpu/ozone/simple_params.hh rename : python/m5/objects/AlphaFullCPU.py => src/python/m5/objects/AlphaFullCPU.py rename : python/m5/objects/OzoneCPU.py => src/python/m5/objects/OzoneCPU.py extra : convert_revision : b7be30474dd03dd3970e737a9d0489aeb2ead84f
147 lines
4.9 KiB
C++
147 lines
4.9 KiB
C++
/*
|
|
* Copyright (c) 2004-2005 The Regents of The University of Michigan
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are
|
|
* met: redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer;
|
|
* redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution;
|
|
* neither the name of the copyright holders nor the names of its
|
|
* contributors may be used to endorse or promote products derived from
|
|
* this software without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*
|
|
* Authors: Kevin Lim
|
|
*/
|
|
|
|
#ifndef __CPU_O3_STORE_SET_HH__
|
|
#define __CPU_O3_STORE_SET_HH__
|
|
|
|
#include <list>
|
|
#include <map>
|
|
#include <utility>
|
|
#include <vector>
|
|
|
|
#include "arch/isa_traits.hh"
|
|
#include "cpu/inst_seq.hh"
|
|
|
|
struct ltseqnum {
|
|
bool operator()(const InstSeqNum &lhs, const InstSeqNum &rhs) const
|
|
{
|
|
return lhs > rhs;
|
|
}
|
|
};
|
|
|
|
/**
|
|
* Implements a store set predictor for determining if memory
|
|
* instructions are dependent upon each other. See paper "Memory
|
|
* Dependence Prediction using Store Sets" by Chrysos and Emer. SSID
|
|
* stands for Store Set ID, SSIT stands for Store Set ID Table, and
|
|
* LFST is Last Fetched Store Table.
|
|
*/
|
|
class StoreSet
|
|
{
|
|
public:
|
|
typedef unsigned SSID;
|
|
|
|
public:
|
|
/** Default constructor. init() must be called prior to use. */
|
|
StoreSet() { };
|
|
|
|
/** Creates store set predictor with given table sizes. */
|
|
StoreSet(int SSIT_size, int LFST_size);
|
|
|
|
/** Default destructor. */
|
|
~StoreSet();
|
|
|
|
/** Initializes the store set predictor with the given table sizes. */
|
|
void init(int SSIT_size, int LFST_size);
|
|
|
|
/** Records a memory ordering violation between the younger load
|
|
* and the older store. */
|
|
void violation(Addr store_PC, Addr load_PC);
|
|
|
|
/** Inserts a load into the store set predictor. This does nothing but
|
|
* is included in case other predictors require a similar function.
|
|
*/
|
|
void insertLoad(Addr load_PC, InstSeqNum load_seq_num);
|
|
|
|
/** Inserts a store into the store set predictor. Updates the
|
|
* LFST if the store has a valid SSID. */
|
|
void insertStore(Addr store_PC, InstSeqNum store_seq_num,
|
|
unsigned tid);
|
|
|
|
/** Checks if the instruction with the given PC is dependent upon
|
|
* any store. @return Returns the sequence number of the store
|
|
* instruction this PC is dependent upon. Returns 0 if none.
|
|
*/
|
|
InstSeqNum checkInst(Addr PC);
|
|
|
|
/** Records this PC/sequence number as issued. */
|
|
void issued(Addr issued_PC, InstSeqNum issued_seq_num, bool is_store);
|
|
|
|
/** Squashes for a specific thread until the given sequence number. */
|
|
void squash(InstSeqNum squashed_num, unsigned tid);
|
|
|
|
/** Resets all tables. */
|
|
void clear();
|
|
|
|
/** Debug function to dump the contents of the store list. */
|
|
void dump();
|
|
|
|
private:
|
|
/** Calculates the index into the SSIT based on the PC. */
|
|
inline int calcIndex(Addr PC)
|
|
{ return (PC >> offsetBits) & indexMask; }
|
|
|
|
/** Calculates a Store Set ID based on the PC. */
|
|
inline SSID calcSSID(Addr PC)
|
|
{ return ((PC ^ (PC >> 10)) % LFSTSize); }
|
|
|
|
/** The Store Set ID Table. */
|
|
std::vector<SSID> SSIT;
|
|
|
|
/** Bit vector to tell if the SSIT has a valid entry. */
|
|
std::vector<bool> validSSIT;
|
|
|
|
/** Last Fetched Store Table. */
|
|
std::vector<InstSeqNum> LFST;
|
|
|
|
/** Bit vector to tell if the LFST has a valid entry. */
|
|
std::vector<bool> validLFST;
|
|
|
|
/** Map of stores that have been inserted into the store set, but
|
|
* not yet issued or squashed.
|
|
*/
|
|
std::map<InstSeqNum, int, ltseqnum> storeList;
|
|
|
|
typedef std::map<InstSeqNum, int, ltseqnum>::iterator SeqNumMapIt;
|
|
|
|
/** Store Set ID Table size, in entries. */
|
|
int SSITSize;
|
|
|
|
/** Last Fetched Store Table size, in entries. */
|
|
int LFSTSize;
|
|
|
|
/** Mask to obtain the index. */
|
|
int indexMask;
|
|
|
|
// HACK: Hardcoded for now.
|
|
int offsetBits;
|
|
};
|
|
|
|
#endif // __CPU_O3_STORE_SET_HH__
|