diff options
author | Andreas Hansson <andreas.hansson@arm.com> | 2015-07-03 10:14:45 -0400 |
---|---|---|
committer | Andreas Hansson <andreas.hansson@arm.com> | 2015-07-03 10:14:45 -0400 |
commit | b56167b68214581857ffae5c25f7945d75cee6b3 (patch) | |
tree | c0d9d30d659a8e8bd6d27b9a4bcbd4438e413025 /src | |
parent | db85ddca1a3c81fb7c513216fa08bb1f6dd580b7 (diff) | |
download | gem5-b56167b68214581857ffae5c25f7945d75cee6b3.tar.xz |
mem: Avoid DRAM write queue iteration for merging and read lookup
This patch adds a simple lookup structure to avoid iterating over the
write queue to find read matches, and for the merging of write
bursts. Instead of relying on iteration we simply store a set of
currently-buffered write-burst addresses and compare against
these. For the reads we still perform the iteration if we have a
match. For the writes, we rely entirely on the set. Note that there
are corner-cases where sub-bursts would actually not be mergeable
without a read-modify-write. We ignore these cases and opt for speed.
Diffstat (limited to 'src')
-rw-r--r-- | src/mem/dram_ctrl.cc | 98 | ||||
-rw-r--r-- | src/mem/dram_ctrl.hh | 21 |
2 files changed, 48 insertions, 71 deletions
diff --git a/src/mem/dram_ctrl.cc b/src/mem/dram_ctrl.cc index 196f599af..3a4778978 100644 --- a/src/mem/dram_ctrl.cc +++ b/src/mem/dram_ctrl.cc @@ -1,5 +1,5 @@ /* - * Copyright (c) 2010-2014 ARM Limited + * Copyright (c) 2010-2015 ARM Limited * All rights reserved * * The license below extends only to copyright in the software and shall @@ -97,6 +97,9 @@ DRAMCtrl::DRAMCtrl(const DRAMCtrlParams* p) : fatal_if(!isPowerOf2(ranksPerChannel), "DRAM rank count of %d is not " "allowed, must be a power of two\n", ranksPerChannel); + fatal_if(!isPowerOf2(burstSize), "DRAM burst size %d is not allowed, " + "must be a power of two\n", burstSize); + for (int i = 0; i < ranksPerChannel; i++) { Rank* rank = new Rank(*this, p); ranks.push_back(rank); @@ -438,18 +441,22 @@ DRAMCtrl::addToReadQueue(PacketPtr pkt, unsigned int pktCount) // First check write buffer to see if the data is already at // the controller bool foundInWrQ = false; - for (auto i = writeQueue.begin(); i != writeQueue.end(); ++i) { - // check if the read is subsumed in the write entry we are - // looking at - if ((*i)->addr <= addr && - (addr + size) <= ((*i)->addr + (*i)->size)) { - foundInWrQ = true; - servicedByWrQ++; - pktsServicedByWrQ++; - DPRINTF(DRAM, "Read to addr %lld with size %d serviced by " - "write queue\n", addr, size); - bytesReadWrQ += burstSize; - break; + Addr burst_addr = burstAlign(addr); + // if the burst address is not present then there is no need + // looking any further + if (isInWriteQueue.find(burst_addr) != isInWriteQueue.end()) { + for (const auto& p : writeQueue) { + // check if the read is subsumed in the write queue + // packet we are looking at + if (p->addr <= addr && (addr + size) <= (p->addr + p->size)) { + foundInWrQ = true; + servicedByWrQ++; + pktsServicedByWrQ++; + DPRINTF(DRAM, "Read to addr %lld with size %d serviced by " + "write queue\n", addr, size); + bytesReadWrQ += burstSize; + break; + } } } @@ -517,63 +524,9 @@ DRAMCtrl::addToWriteQueue(PacketPtr pkt, unsigned int pktCount) writeBursts++; // see if we can merge with an existing item in the write - // queue and keep track of whether we have merged or not so we - // can stop at that point and also avoid enqueueing a new - // request - bool merged = false; - auto w = writeQueue.begin(); - - while(!merged && w != writeQueue.end()) { - // either of the two could be first, if they are the same - // it does not matter which way we go - if ((*w)->addr >= addr) { - // the existing one starts after the new one, figure - // out where the new one ends with respect to the - // existing one - if ((addr + size) >= ((*w)->addr + (*w)->size)) { - // check if the existing one is completely - // subsumed in the new one - DPRINTF(DRAM, "Merging write covering existing burst\n"); - merged = true; - // update both the address and the size - (*w)->addr = addr; - (*w)->size = size; - } else if ((addr + size) >= (*w)->addr && - ((*w)->addr + (*w)->size - addr) <= burstSize) { - // the new one is just before or partially - // overlapping with the existing one, and together - // they fit within a burst - DPRINTF(DRAM, "Merging write before existing burst\n"); - merged = true; - // the existing queue item needs to be adjusted with - // respect to both address and size - (*w)->size = (*w)->addr + (*w)->size - addr; - (*w)->addr = addr; - } - } else { - // the new one starts after the current one, figure - // out where the existing one ends with respect to the - // new one - if (((*w)->addr + (*w)->size) >= (addr + size)) { - // check if the new one is completely subsumed in the - // existing one - DPRINTF(DRAM, "Merging write into existing burst\n"); - merged = true; - // no adjustments necessary - } else if (((*w)->addr + (*w)->size) >= addr && - (addr + size - (*w)->addr) <= burstSize) { - // the existing one is just before or partially - // overlapping with the new one, and together - // they fit within a burst - DPRINTF(DRAM, "Merging write after existing burst\n"); - merged = true; - // the address is right, and only the size has - // to be adjusted - (*w)->size = addr + size - (*w)->addr; - } - } - ++w; - } + // queue and keep track of whether we have merged or not + bool merged = isInWriteQueue.find(burstAlign(addr)) != + isInWriteQueue.end(); // if the item was not merged we need to create a new write // and enqueue it @@ -586,10 +539,14 @@ DRAMCtrl::addToWriteQueue(PacketPtr pkt, unsigned int pktCount) DPRINTF(DRAM, "Adding to write queue\n"); writeQueue.push_back(dram_pkt); + isInWriteQueue.insert(burstAlign(addr)); + assert(writeQueue.size() == isInWriteQueue.size()); // Update stats avgWrQLen = writeQueue.size(); } else { + DPRINTF(DRAM, "Merging write burst with existing queue entry\n"); + // keep track of the fact that this burst effectively // disappeared as it was merged with an existing one mergedWrBursts++; @@ -1418,6 +1375,7 @@ DRAMCtrl::processNextReqEvent() doDRAMAccess(dram_pkt); writeQueue.pop_front(); + isInWriteQueue.erase(burstAlign(dram_pkt->addr)); delete dram_pkt; // If we emptied the write queue, or got sufficiently below the diff --git a/src/mem/dram_ctrl.hh b/src/mem/dram_ctrl.hh index 3caaff959..57731f5e0 100644 --- a/src/mem/dram_ctrl.hh +++ b/src/mem/dram_ctrl.hh @@ -1,5 +1,5 @@ /* - * Copyright (c) 2012-2014 ARM Limited + * Copyright (c) 2012-2015 ARM Limited * All rights reserved * * The license below extends only to copyright in the software and shall @@ -53,6 +53,7 @@ #include <deque> #include <string> +#include <unordered_set> #include "base/statistics.hh" #include "enums/AddrMap.hh" @@ -637,12 +638,30 @@ class DRAMCtrl : public AbstractMemory void printQs() const; /** + * Burst-align an address. + * + * @param addr The potentially unaligned address + * + * @return An address aligned to a DRAM burst + */ + Addr burstAlign(Addr addr) const { return (addr & ~(Addr(burstSize - 1))); } + + /** * The controller's main read and write queues */ std::deque<DRAMPacket*> readQueue; std::deque<DRAMPacket*> writeQueue; /** + * To avoid iterating over the write queue to check for + * overlapping transactions, maintain a set of burst addresses + * that are currently queued. Since we merge writes to the same + * location we never have more than one address to the same burst + * address. + */ + std::unordered_set<Addr> isInWriteQueue; + + /** * Response queue where read packets wait after we're done working * with them, but it's not time to send the response yet. The * responses are stored seperately mostly to keep the code clean |