mem: Support WriteInvalidate (again)

This patch takes a clean-slate approach to providing WriteInvalidate
(write streaming, full cache line writes without first reading)
support.

Unlike the prior attempt, which took an aggressive approach of directly
writing into the cache before handling the coherence actions, this
approach follows the existing cache flows as closely as possible.
This commit is contained in:
Curtis Dunham 2014-12-02 06:08:19 -05:00
parent 7ca27dd3cc
commit 5d22250845
3 changed files with 85 additions and 35 deletions

View file

@ -379,6 +379,13 @@ AbstractMemory::access(PacketPtr pkt)
bytesRead[pkt->req->masterId()] += pkt->getSize(); bytesRead[pkt->req->masterId()] += pkt->getSize();
if (pkt->req->isInstFetch()) if (pkt->req->isInstFetch())
bytesInstRead[pkt->req->masterId()] += pkt->getSize(); bytesInstRead[pkt->req->masterId()] += pkt->getSize();
} else if (pkt->isInvalidate()) {
// no need to do anything
// this clause is intentionally before the write clause: the only
// transaction that is both a write and an invalidate is
// WriteInvalidate, and for the sake of consistency, it does not
// write to memory. in a cacheless system, there are no WriteInv's
// because the Write -> WriteInvalidate rewrite happens in the cache.
} else if (pkt->isWrite()) { } else if (pkt->isWrite()) {
if (writeOK(pkt)) { if (writeOK(pkt)) {
if (pmemAddr) { if (pmemAddr) {
@ -391,8 +398,6 @@ AbstractMemory::access(PacketPtr pkt)
numWrites[pkt->req->masterId()]++; numWrites[pkt->req->masterId()]++;
bytesWritten[pkt->req->masterId()] += pkt->getSize(); bytesWritten[pkt->req->masterId()] += pkt->getSize();
} }
} else if (pkt->isInvalidate()) {
// no need to do anything
} else { } else {
panic("unimplemented"); panic("unimplemented");
} }

View file

@ -70,7 +70,7 @@ Cache<TagStore>::Cache(const Params *p)
: BaseCache(p), : BaseCache(p),
tags(dynamic_cast<TagStore*>(p->tags)), tags(dynamic_cast<TagStore*>(p->tags)),
prefetcher(p->prefetcher), prefetcher(p->prefetcher),
doFastWrites(false), doFastWrites(true),
prefetchOnAccess(p->prefetch_on_access) prefetchOnAccess(p->prefetch_on_access)
{ {
tempBlock = new BlkType(); tempBlock = new BlkType();
@ -167,7 +167,10 @@ Cache<TagStore>::satisfyCpuSideRequest(PacketPtr pkt, BlkType *blk,
// isWrite() will be true for them // isWrite() will be true for them
if (pkt->cmd == MemCmd::SwapReq) { if (pkt->cmd == MemCmd::SwapReq) {
cmpAndSwap(blk, pkt); cmpAndSwap(blk, pkt);
} else if (pkt->isWrite()) { } else if (pkt->isWrite() &&
(!pkt->isWriteInvalidate() || isTopLevel)) {
assert(blk->isWritable());
// Write or WriteInvalidate at the first cache with block in Exclusive
if (blk->checkWrite(pkt)) { if (blk->checkWrite(pkt)) {
pkt->writeDataToBlock(blk->data, blkSize); pkt->writeDataToBlock(blk->data, blkSize);
} }
@ -176,6 +179,8 @@ Cache<TagStore>::satisfyCpuSideRequest(PacketPtr pkt, BlkType *blk,
// appended themselves to this cache before knowing the store // appended themselves to this cache before knowing the store
// will fail. // will fail.
blk->status |= BlkDirty; blk->status |= BlkDirty;
DPRINTF(Cache, "%s for %s address %x size %d (write)\n", __func__,
pkt->cmdString(), pkt->getAddr(), pkt->getSize());
} else if (pkt->isRead()) { } else if (pkt->isRead()) {
if (pkt->isLLSC()) { if (pkt->isLLSC()) {
blk->trackLoadLocked(pkt); blk->trackLoadLocked(pkt);
@ -229,13 +234,15 @@ Cache<TagStore>::satisfyCpuSideRequest(PacketPtr pkt, BlkType *blk,
} }
} }
} else { } else {
// Not a read or write... must be an upgrade. it's OK // Upgrade or WriteInvalidate at a different cache than received it.
// to just ack those as long as we have an exclusive // Since we have it Exclusively (E or M), we ack then invalidate.
// copy at this level. assert(pkt->isUpgrade() ||
assert(pkt->isUpgrade()); (pkt->isWriteInvalidate() && !isTopLevel));
assert(blk != tempBlock); assert(blk != tempBlock);
tags->invalidate(blk); tags->invalidate(blk);
blk->invalidate(); blk->invalidate();
DPRINTF(Cache, "%s for %s address %x size %d (invalidation)\n",
__func__, pkt->cmdString(), pkt->getAddr(), pkt->getSize());
} }
} }
@ -742,6 +749,8 @@ Cache<TagStore>::getBusPacket(PacketPtr cpu_pkt, BlkType *blk,
// where the determination the StoreCond fails is delayed due to // where the determination the StoreCond fails is delayed due to
// all caches not being on the same local bus. // all caches not being on the same local bus.
cmd = MemCmd::SCUpgradeFailReq; cmd = MemCmd::SCUpgradeFailReq;
} else if (cpu_pkt->isWriteInvalidate()) {
cmd = cpu_pkt->cmd;
} else { } else {
// block is invalid // block is invalid
cmd = needsExclusive ? MemCmd::ReadExReq : MemCmd::ReadReq; cmd = needsExclusive ? MemCmd::ReadExReq : MemCmd::ReadReq;
@ -843,6 +852,14 @@ Cache<TagStore>::recvAtomic(PacketPtr pkt)
if (bus_pkt->isError()) { if (bus_pkt->isError()) {
pkt->makeAtomicResponse(); pkt->makeAtomicResponse();
pkt->copyError(bus_pkt); pkt->copyError(bus_pkt);
} else if (pkt->isWriteInvalidate()) {
// note the use of pkt, not bus_pkt here.
if (isTopLevel) {
blk = handleFill(pkt, blk, writebacks);
satisfyCpuSideRequest(pkt, blk);
} else if (blk) {
satisfyCpuSideRequest(pkt, blk);
}
} else if (bus_pkt->isRead() || } else if (bus_pkt->isRead() ||
bus_pkt->cmd == MemCmd::UpgradeResp) { bus_pkt->cmd == MemCmd::UpgradeResp) {
// we're updating cache state to allow us to // we're updating cache state to allow us to
@ -1048,6 +1065,23 @@ Cache<TagStore>::recvTimingResp(PacketPtr pkt)
break; // skip response break; // skip response
} }
// unlike the other packet flows, where data is found in other
// caches or memory and brought back, write invalidates always
// have the data right away, so the above check for "is fill?"
// cannot actually be determined until examining the stored MSHR
// state. We "catch up" with that logic here, which is duplicated
// from above.
if (target->pkt->isWriteInvalidate() && isTopLevel) {
assert(!is_error);
// NB: we use the original packet here and not the response!
mshr->handleFill(target->pkt, blk);
blk = handleFill(target->pkt, blk, writebacks);
assert(blk != NULL);
is_fill = true;
}
if (is_fill) { if (is_fill) {
satisfyCpuSideRequest(target->pkt, blk, satisfyCpuSideRequest(target->pkt, blk,
true, mshr->hasPostDowngrade()); true, mshr->hasPostDowngrade());
@ -1138,7 +1172,8 @@ Cache<TagStore>::recvTimingResp(PacketPtr pkt)
} }
if (blk && blk->isValid()) { if (blk && blk->isValid()) {
if (pkt->isInvalidate() || mshr->hasPostInvalidate()) { if ((pkt->isInvalidate() || mshr->hasPostInvalidate()) &&
(!pkt->isWriteInvalidate() || !isTopLevel)) {
assert(blk != tempBlock); assert(blk != tempBlock);
tags->invalidate(blk); tags->invalidate(blk);
blk->invalidate(); blk->invalidate();
@ -1344,7 +1379,7 @@ typename Cache<TagStore>::BlkType*
Cache<TagStore>::handleFill(PacketPtr pkt, BlkType *blk, Cache<TagStore>::handleFill(PacketPtr pkt, BlkType *blk,
PacketList &writebacks) PacketList &writebacks)
{ {
assert(pkt->isResponse()); assert(pkt->isResponse() || pkt->isWriteInvalidate());
Addr addr = pkt->getAddr(); Addr addr = pkt->getAddr();
bool is_secure = pkt->isSecure(); bool is_secure = pkt->isSecure();
#if TRACING_ON #if TRACING_ON
@ -1355,8 +1390,10 @@ Cache<TagStore>::handleFill(PacketPtr pkt, BlkType *blk,
// better have read new data... // better have read new data...
assert(pkt->hasData()); assert(pkt->hasData());
// only read reaponses have data // only read responses and (original) write invalidate req's have data;
assert(pkt->isRead()); // note that we don't write the data here for write invalidate - that
// happens in the subsequent satisfyCpuSideRequest.
assert(pkt->isRead() || pkt->isWriteInvalidate());
// need to do a replacement // need to do a replacement
blk = allocateBlock(addr, is_secure, writebacks); blk = allocateBlock(addr, is_secure, writebacks);
@ -1539,8 +1576,13 @@ Cache<TagStore>::handleSnoop(PacketPtr pkt, BlkType *blk,
// we may end up modifying both the block state and the packet (if // we may end up modifying both the block state and the packet (if
// we respond in atomic mode), so just figure out what to do now // we respond in atomic mode), so just figure out what to do now
// and then do it later. // and then do it later. If we find dirty data while snooping for a
bool respond = blk->isDirty() && pkt->needsResponse(); // WriteInvalidate, we don't care, since no merging needs to take place.
// We need the eviction to happen as normal, but the data needn't be
// sent anywhere. nor should the writeback be inhibited at the memory
// controller for any reason.
bool respond = blk->isDirty() && pkt->needsResponse()
&& !pkt->isWriteInvalidate();
bool have_exclusive = blk->isWritable(); bool have_exclusive = blk->isWritable();
// Invalidate any prefetch's from below that would strip write permissions // Invalidate any prefetch's from below that would strip write permissions

View file

@ -177,14 +177,16 @@ class MemCmd
public: public:
bool isRead() const { return testCmdAttrib(IsRead); } bool isRead() const { return testCmdAttrib(IsRead); }
bool isWrite() const { return testCmdAttrib(IsWrite); } bool isWrite() const { return testCmdAttrib(IsWrite); }
bool isUpgrade() const { return testCmdAttrib(IsUpgrade); } bool isUpgrade() const { return testCmdAttrib(IsUpgrade); }
bool isRequest() const { return testCmdAttrib(IsRequest); } bool isRequest() const { return testCmdAttrib(IsRequest); }
bool isResponse() const { return testCmdAttrib(IsResponse); } bool isResponse() const { return testCmdAttrib(IsResponse); }
bool needsExclusive() const { return testCmdAttrib(NeedsExclusive); } bool needsExclusive() const { return testCmdAttrib(NeedsExclusive); }
bool needsResponse() const { return testCmdAttrib(NeedsResponse); } bool needsResponse() const { return testCmdAttrib(NeedsResponse); }
bool isInvalidate() const { return testCmdAttrib(IsInvalidate); } bool isInvalidate() const { return testCmdAttrib(IsInvalidate); }
bool isWriteInvalidate() const { return testCmdAttrib(IsWrite) &&
testCmdAttrib(IsInvalidate); }
/** /**
* Check if this particular packet type carries payload data. Note * Check if this particular packet type carries payload data. Note
@ -495,19 +497,20 @@ class Packet : public Printable
/// Return the index of this command. /// Return the index of this command.
inline int cmdToIndex() const { return cmd.toInt(); } inline int cmdToIndex() const { return cmd.toInt(); }
bool isRead() const { return cmd.isRead(); } bool isRead() const { return cmd.isRead(); }
bool isWrite() const { return cmd.isWrite(); } bool isWrite() const { return cmd.isWrite(); }
bool isUpgrade() const { return cmd.isUpgrade(); } bool isUpgrade() const { return cmd.isUpgrade(); }
bool isRequest() const { return cmd.isRequest(); } bool isRequest() const { return cmd.isRequest(); }
bool isResponse() const { return cmd.isResponse(); } bool isResponse() const { return cmd.isResponse(); }
bool needsExclusive() const { return cmd.needsExclusive(); } bool needsExclusive() const { return cmd.needsExclusive(); }
bool needsResponse() const { return cmd.needsResponse(); } bool needsResponse() const { return cmd.needsResponse(); }
bool isInvalidate() const { return cmd.isInvalidate(); } bool isInvalidate() const { return cmd.isInvalidate(); }
bool hasData() const { return cmd.hasData(); } bool isWriteInvalidate() const { return cmd.isWriteInvalidate(); }
bool isLLSC() const { return cmd.isLLSC(); } bool hasData() const { return cmd.hasData(); }
bool isError() const { return cmd.isError(); } bool isLLSC() const { return cmd.isLLSC(); }
bool isPrint() const { return cmd.isPrint(); } bool isError() const { return cmd.isError(); }
bool isFlush() const { return cmd.isFlush(); } bool isPrint() const { return cmd.isPrint(); }
bool isFlush() const { return cmd.isFlush(); }
// Snoop flags // Snoop flags
void assertMemInhibit() void assertMemInhibit()