summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--src/cpu/o3/inst_queue_impl.hh4
-rw-r--r--src/cpu/o3/lsq_unit_impl.hh7
-rw-r--r--src/cpu/o3/rob_impl.hh1
-rw-r--r--src/mem/protocol/MESI_Two_Level-L1cache.sm2
-rw-r--r--src/mem/ruby/system/Sequencer.cc14
-rw-r--r--src/mem/ruby/system/Sequencer.hh1
6 files changed, 14 insertions, 15 deletions
diff --git a/src/cpu/o3/inst_queue_impl.hh b/src/cpu/o3/inst_queue_impl.hh
index 0a6d309fe..a30bf7f5f 100644
--- a/src/cpu/o3/inst_queue_impl.hh
+++ b/src/cpu/o3/inst_queue_impl.hh
@@ -1182,8 +1182,12 @@ InstructionQueue<Impl>::getDeferredMemInstToExecute()
// 2. virtual fence ahead
// 3. not ready to expose and gets a TLB miss
// for both (2, 3) we need to restart the translation
+
+ DPRINTF(IQ, "sn:%lli onlyWaitForFence = %d, fenceDelay = %d\n", (*it)->seqNum, (*it)->onlyWaitForFence(), (*it)->fenceDelay() );
+
if ( (*it)->translationCompleted()
|| ((*it)->onlyWaitForFence() && !(*it)->fenceDelay())
+ || ((*it)->onlyWaitForExpose() && (*it)->readyToExpose())
|| (*it)->isSquashed()) {
DynInstPtr mem_inst = std::move(*it);
mem_inst->onlyWaitForFence(false);
diff --git a/src/cpu/o3/lsq_unit_impl.hh b/src/cpu/o3/lsq_unit_impl.hh
index ebc963d5b..80445e261 100644
--- a/src/cpu/o3/lsq_unit_impl.hh
+++ b/src/cpu/o3/lsq_unit_impl.hh
@@ -128,6 +128,8 @@ LSQUnit<Impl>::completeDataAccess(PacketPtr pkt)
DPRINTF(LSQUnit, "spec load miss for inst [sn:%lli], fence it.\n",
inst->seqNum);
inst->fenceDelay(true);
+ } else {
+ DPRINTF(LSQUnit, "spec load hit for inst [sn:%lli].\n");
}
assert(!cpu->switchedOut());
@@ -918,6 +920,7 @@ LSQUnit<Impl>::updateVisibleState()
//iterate all the loads and update its fencedelay state accordingly
while (load_idx != loadTail && loadQueue[load_idx]){
DynInstPtr inst = loadQueue[load_idx];
+ DPRINTF(LSQUnit, "update visible state for inst [sn:%lli].\n", inst->seqNum);
if (!loadInExec){
@@ -981,6 +984,7 @@ LSQUnit<Impl>::updateVisibleState()
assert(0);
//--loadsToVLD;
}
+ DPRINTF(LSQUnit, "inst [sn:%lli] not ready to expose.\n", inst->seqNum);
inst->readyToExpose(false);
} else {
/* set taint for dst registers */
@@ -1370,7 +1374,10 @@ LSQUnit<Impl>::writeback(const DynInstPtr &inst, PacketPtr pkt)
if (inst->fenceDelay()) {
DPRINTF(LSQUnit, "To write back a fence delayed spec load [sn:%lli].\n", inst->seqNum);
+ assert(pkt->isSpec());
inst->onlyWaitForFence(true);
+ inst->translationStarted(false);
+ inst->translationCompleted(false);
iewStage->instQueue.deferMemInst(inst);
} else if (!inst->isExecuted()) {
inst->setExecuted();
diff --git a/src/cpu/o3/rob_impl.hh b/src/cpu/o3/rob_impl.hh
index b729a9d00..32cfe04a1 100644
--- a/src/cpu/o3/rob_impl.hh
+++ b/src/cpu/o3/rob_impl.hh
@@ -434,6 +434,7 @@ ROB<Impl>::updateVisibleState()
while (inst_it != tail_inst_it) {
DynInstPtr inst = *inst_it++;
+ DPRINTF(ROB, "updating rob visible state for [sn:%lli]\n", inst->seqNum);
assert(inst!=0);
diff --git a/src/mem/protocol/MESI_Two_Level-L1cache.sm b/src/mem/protocol/MESI_Two_Level-L1cache.sm
index 8496fda61..e925057db 100644
--- a/src/mem/protocol/MESI_Two_Level-L1cache.sm
+++ b/src/mem/protocol/MESI_Two_Level-L1cache.sm
@@ -1227,7 +1227,7 @@ machine(MachineType:L1Cache, "MESI Directory L1 Cache CMP")
k_popMandatoryQueue;
}
- transition({NP,I}, SpecLoad, IX) {
+ transition({NP,I}, SpecLoad) {
h_spec_load_miss;
k_popMandatoryQueue;
}
diff --git a/src/mem/ruby/system/Sequencer.cc b/src/mem/ruby/system/Sequencer.cc
index 090030f08..a0d3cab1b 100644
--- a/src/mem/ruby/system/Sequencer.cc
+++ b/src/mem/ruby/system/Sequencer.cc
@@ -237,16 +237,6 @@ Sequencer::insertRequest(PacketPtr pkt, RubyRequestType request_type)
RequestTable::iterator i = r.first;
i->second = new SequencerRequest(pkt, request_type, curCycle());
m_outstanding_count++;
- } else if (request_type == RubyRequestType_SPEC_LD) {
- auto i = m_readRequestTable.find(line_addr);
- if (i->second->m_type == RubyRequestType_SPEC_LD) {
- DPRINTFR(SpecBuffer, "%10s Merging (idx=%d-%d, addr=%#x) with %d\n", curTick(), pkt->reqIdx, pkt->isFirst()? 0 : 1, printAddress(pkt->getAddr()), i->second->pkt->reqIdx);
- i->second->dependentSpecRequests.push_back(pkt);
- return RequestStatus_Merged;
- } else {
- m_load_waiting_on_load++;
- return RequestStatus_Aliased;
- }
} else {
// There is an outstanding read request for the cache line
m_load_waiting_on_load++;
@@ -653,9 +643,7 @@ Sequencer::makeRequest(PacketPtr pkt)
}
RequestStatus status = insertRequest(pkt, primary_type);
- if (status == RequestStatus_Merged) {
- return RequestStatus_Issued;
- } else if (status != RequestStatus_Ready) {
+ if (status != RequestStatus_Ready) {
return status;
}
diff --git a/src/mem/ruby/system/Sequencer.hh b/src/mem/ruby/system/Sequencer.hh
index 8e1f08a48..d9ed62320 100644
--- a/src/mem/ruby/system/Sequencer.hh
+++ b/src/mem/ruby/system/Sequencer.hh
@@ -46,7 +46,6 @@ struct SequencerRequest
PacketPtr pkt;
RubyRequestType m_type;
Cycles issue_time;
- std::vector<PacketPtr> dependentSpecRequests;
SequencerRequest(PacketPtr _pkt, RubyRequestType _m_type,
Cycles _issue_time)