src/mem/ruby/system/Sequencer.cc

   1 /*
   2  * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
   3  * All rights reserved.
   4  *
   5  * Redistribution and use in source and binary forms, with or without
   6  * modification, are permitted provided that the following conditions are
   7  * met: redistributions of source code must retain the above copyright
   8  * notice, this list of conditions and the following disclaimer;
   9  * redistributions in binary form must reproduce the above copyright
  10  * notice, this list of conditions and the following disclaimer in the
  11  * documentation and/or other materials provided with the distribution;
  12  * neither the name of the copyright holders nor the names of its
  13  * contributors may be used to endorse or promote products derived from
  14  * this software without specific prior written permission.
  15  *
  16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  17  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  18  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  19  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  20  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  21  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  22  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  26  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  27  */
  28
  29 #include "mem/ruby/system/Sequencer.hh"
  30
  31 #include "arch/x86/ldstflags.hh"
  32 #include "base/misc.hh"
  33 #include "base/str.hh"
  34 #include "cpu/testers/rubytest/RubyTester.hh"
  35 #include "debug/MemoryAccess.hh"
  36 #include "debug/ProtocolTrace.hh"
  37 #include "debug/RubySequencer.hh"
  38 #include "debug/RubyStats.hh"
  39 #include "mem/packet.hh"
  40 #include "mem/protocol/PrefetchBit.hh"
  41 #include "mem/protocol/RubyAccessMode.hh"
  42 #include "mem/ruby/profiler/Profiler.hh"
  43 #include "mem/ruby/slicc_interface/RubyRequest.hh"
  44 #include "mem/ruby/system/RubySystem.hh"
  45 #include "sim/system.hh"
  46
  47 using namespace std;
  48
  49 Sequencer *
  50 RubySequencerParams::create()
  51 {
  52     return new Sequencer(this);
  53 }
  54
  55 Sequencer::Sequencer(const Params *p)
  56     : RubyPort(p), m_IncompleteTimes(MachineType_NUM), deadlockCheckEvent(this)
  57 {
  58     m_outstanding_count = 0;
  59
  60     m_instCache_ptr = p->icache;
  61     m_dataCache_ptr = p->dcache;
  62     m_data_cache_hit_latency = p->dcache_hit_latency;
  63     m_inst_cache_hit_latency = p->icache_hit_latency;
  64     m_max_outstanding_requests = p->max_outstanding_requests;
  65     m_deadlock_threshold = p->deadlock_threshold;
  66
  67     m_coreId = p->coreid; // for tracking the two CorePair sequencers
  68     assert(m_max_outstanding_requests > 0);
  69     assert(m_deadlock_threshold > 0);
  70     assert(m_instCache_ptr != NULL);
  71     assert(m_dataCache_ptr != NULL);
  72     assert(m_data_cache_hit_latency > 0);
  73     assert(m_inst_cache_hit_latency > 0);
  74
  75     m_runningGarnetStandalone = p->garnet_standalone;
  76 }
  77
  78 Sequencer::~Sequencer()
  79 {
  80 }
  81
  82 void
  83 Sequencer::wakeup()
  84 {
  85     assert(drainState() != DrainState::Draining);
  86
  87     // Check for deadlock of any of the requests
  88     Cycles current_time = curCycle();
  89
  90     // Check across all outstanding requests
  91     int total_outstanding = 0;
  92
  93     RequestTable::iterator read = m_readRequestTable.begin();
  94     RequestTable::iterator read_end = m_readRequestTable.end();
  95     for (; read != read_end; ++read) {
  96         SequencerRequest* request = read->second;
  97         if (current_time - request->issue_time < m_deadlock_threshold)
  98             continue;
  99
 100         panic("Possible Deadlock detected. Aborting!\n"
 101               "version: %d request.paddr: 0x%x m_readRequestTable: %d "
 102               "current time: %u issue_time: %d difference: %d\n", m_version,
 103               request->pkt->getAddr(), m_readRequestTable.size(),
 104               current_time * clockPeriod(), request->issue_time * clockPeriod(),
 105               (current_time * clockPeriod()) - (request->issue_time * clockPeriod()));
 106     }
 107
 108     RequestTable::iterator write = m_writeRequestTable.begin();
 109     RequestTable::iterator write_end = m_writeRequestTable.end();
 110     for (; write != write_end; ++write) {
 111         SequencerRequest* request = write->second;
 112         if (current_time - request->issue_time < m_deadlock_threshold)
 113             continue;
 114
 115         panic("Possible Deadlock detected. Aborting!\n"
 116               "version: %d request.paddr: 0x%x m_writeRequestTable: %d "
 117               "current time: %u issue_time: %d difference: %d\n", m_version,
 118               request->pkt->getAddr(), m_writeRequestTable.size(),
 119               current_time * clockPeriod(), request->issue_time * clockPeriod(),
 120               (current_time * clockPeriod()) - (request->issue_time * clockPeriod()));
 121     }
 122
 123     total_outstanding += m_writeRequestTable.size();
 124     total_outstanding += m_readRequestTable.size();
 125
 126     assert(m_outstanding_count == total_outstanding);
 127
 128     if (m_outstanding_count > 0) {
 129         // If there are still outstanding requests, keep checking
 130         schedule(deadlockCheckEvent, clockEdge(m_deadlock_threshold));
 131     }
 132 }
 133
 134 void Sequencer::resetStats()
 135 {
 136     m_latencyHist.reset();
 137     m_hitLatencyHist.reset();
 138     m_missLatencyHist.reset();
 139     for (int i = 0; i < RubyRequestType_NUM; i++) {
 140         m_typeLatencyHist[i]->reset();
 141         m_hitTypeLatencyHist[i]->reset();
 142         m_missTypeLatencyHist[i]->reset();
 143         for (int j = 0; j < MachineType_NUM; j++) {
 144             m_hitTypeMachLatencyHist[i][j]->reset();
 145             m_missTypeMachLatencyHist[i][j]->reset();
 146         }
 147     }
 148
 149     for (int i = 0; i < MachineType_NUM; i++) {
 150         m_missMachLatencyHist[i]->reset();
 151         m_hitMachLatencyHist[i]->reset();
 152
 153         m_IssueToInitialDelayHist[i]->reset();
 154         m_InitialToForwardDelayHist[i]->reset();
 155         m_ForwardToFirstResponseDelayHist[i]->reset();
 156         m_FirstResponseToCompletionDelayHist[i]->reset();
 157
 158         m_IncompleteTimes[i] = 0;
 159     }
 160 }
 161
 162 // Insert the request on the correct request table.  Return true if
 163 // the entry was already present.
 164 RequestStatus
 165 Sequencer::insertRequest(PacketPtr pkt, RubyRequestType request_type)
 166 {
 167     assert(m_outstanding_count ==
 168         (m_writeRequestTable.size() + m_readRequestTable.size()));
 169
 170     // See if we should schedule a deadlock check
 171     if (!deadlockCheckEvent.scheduled() &&
 172         drainState() != DrainState::Draining) {
 173         schedule(deadlockCheckEvent, clockEdge(m_deadlock_threshold));
 174     }
 175
 176     Addr line_addr = makeLineAddress(pkt->getAddr());
 177
 178     // Check if the line is blocked for a Locked_RMW
 179     if (m_controller->isBlocked(line_addr) &&
 180         (request_type != RubyRequestType_Locked_RMW_Write)) {
 181         // Return that this request's cache line address aliases with
 182         // a prior request that locked the cache line. The request cannot
 183         // proceed until the cache line is unlocked by a Locked_RMW_Write
 184         return RequestStatus_Aliased;
 185     }
 186
 187     // Create a default entry, mapping the address to NULL, the cast is
 188     // there to make gcc 4.4 happy
 189     RequestTable::value_type default_entry(line_addr,
 190                                            (SequencerRequest*) NULL);
 191
 192     if ((request_type == RubyRequestType_ST) ||
 193         (request_type == RubyRequestType_RMW_Read) ||
 194         (request_type == RubyRequestType_RMW_Write) ||
 195         (request_type == RubyRequestType_Load_Linked) ||
 196         (request_type == RubyRequestType_Store_Conditional) ||
 197         (request_type == RubyRequestType_Locked_RMW_Read) ||
 198         (request_type == RubyRequestType_Locked_RMW_Write) ||
 199         (request_type == RubyRequestType_FLUSH)) {
 200
 201         // Check if there is any outstanding read request for the same
 202         // cache line.
 203         if (m_readRequestTable.count(line_addr) > 0) {
 204             m_store_waiting_on_load++;
 205             return RequestStatus_Aliased;
 206         }
 207
 208         pair<RequestTable::iterator, bool> r =
 209             m_writeRequestTable.insert(default_entry);
 210         if (r.second) {
 211             RequestTable::iterator i = r.first;
 212             i->second = new SequencerRequest(pkt, request_type, curCycle());
 213             m_outstanding_count++;
 214         } else {
 215           // There is an outstanding write request for the cache line
 216           m_store_waiting_on_store++;
 217           return RequestStatus_Aliased;
 218         }
 219     } else {
 220         // Check if there is any outstanding write request for the same
 221         // cache line.
 222         if (m_writeRequestTable.count(line_addr) > 0) {
 223             m_load_waiting_on_store++;
 224             return RequestStatus_Aliased;
 225         }
 226
 227         pair<RequestTable::iterator, bool> r =
 228             m_readRequestTable.insert(default_entry);
 229
 230         if (r.second) {
 231             RequestTable::iterator i = r.first;
 232             i->second = new SequencerRequest(pkt, request_type, curCycle());
 233             m_outstanding_count++;
 234         } else {
 235             // There is an outstanding read request for the cache line
 236             m_load_waiting_on_load++;
 237             return RequestStatus_Aliased;
 238         }
 239     }
 240
 241     m_outstandReqHist.sample(m_outstanding_count);
 242     assert(m_outstanding_count ==
 243         (m_writeRequestTable.size() + m_readRequestTable.size()));
 244
 245     return RequestStatus_Ready;
 246 }
 247
 248 void
 249 Sequencer::markRemoved()
 250 {
 251     m_outstanding_count--;
 252     assert(m_outstanding_count ==
 253            m_writeRequestTable.size() + m_readRequestTable.size());
 254 }
 255
 256 void
 257 Sequencer::invalidateSC(Addr address)
 258 {
 259     AbstractCacheEntry *e = m_dataCache_ptr->lookup(address);
 260     // The controller has lost the coherence permissions, hence the lock
 261     // on the cache line maintained by the cache should be cleared.
 262     if (e && e->isLocked(m_version)) {
 263         e->clearLocked();
 264     }
 265 }
 266
 267 bool
 268 Sequencer::handleLlsc(Addr address, SequencerRequest* request)
 269 {
 270     AbstractCacheEntry *e = m_dataCache_ptr->lookup(address);
 271     if (!e)
 272         return true;
 273
 274     // The success flag indicates whether the LLSC operation was successful.
 275     // LL ops will always succeed, but SC may fail if the cache line is no
 276     // longer locked.
 277     bool success = true;
 278     if (request->m_type == RubyRequestType_Store_Conditional) {
 279         if (!e->isLocked(m_version)) {
 280             //
 281             // For failed SC requests, indicate the failure to the cpu by
 282             // setting the extra data to zero.
 283             //
 284             request->pkt->req->setExtraData(0);
 285             success = false;
 286         } else {
 287             //
 288             // For successful SC requests, indicate the success to the cpu by
 289             // setting the extra data to one.
 290             //
 291             request->pkt->req->setExtraData(1);
 292         }
 293         //
 294         // Independent of success, all SC operations must clear the lock
 295         //
 296         e->clearLocked();
 297     } else if (request->m_type == RubyRequestType_Load_Linked) {
 298         //
 299         // Note: To fully follow Alpha LLSC semantics, should the LL clear any
 300         // previously locked cache lines?
 301         //
 302         e->setLocked(m_version);
 303     } else if (e->isLocked(m_version)) {
 304         //
 305         // Normal writes should clear the locked address
 306         //
 307         e->clearLocked();
 308     }
 309     return success;
 310 }
 311
 312 void
 313 Sequencer::recordMissLatency(const Cycles cycles, const RubyRequestType type,
 314                              const MachineType respondingMach,
 315                              bool isExternalHit, Cycles issuedTime,
 316                              Cycles initialRequestTime,
 317                              Cycles forwardRequestTime,
 318                              Cycles firstResponseTime, Cycles completionTime)
 319 {
 320     m_latencyHist.sample(cycles);
 321     m_typeLatencyHist[type]->sample(cycles);
 322
 323     if (isExternalHit) {
 324         m_missLatencyHist.sample(cycles);
 325         m_missTypeLatencyHist[type]->sample(cycles);
 326
 327         if (respondingMach != MachineType_NUM) {
 328             m_missMachLatencyHist[respondingMach]->sample(cycles);
 329             m_missTypeMachLatencyHist[type][respondingMach]->sample(cycles);
 330
 331             if ((issuedTime <= initialRequestTime) &&
 332                 (initialRequestTime <= forwardRequestTime) &&
 333                 (forwardRequestTime <= firstResponseTime) &&
 334                 (firstResponseTime <= completionTime)) {
 335
 336                 m_IssueToInitialDelayHist[respondingMach]->sample(
 337                     initialRequestTime - issuedTime);
 338                 m_InitialToForwardDelayHist[respondingMach]->sample(
 339                     forwardRequestTime - initialRequestTime);
 340                 m_ForwardToFirstResponseDelayHist[respondingMach]->sample(
 341                     firstResponseTime - forwardRequestTime);
 342                 m_FirstResponseToCompletionDelayHist[respondingMach]->sample(
 343                     completionTime - firstResponseTime);
 344             } else {
 345                 m_IncompleteTimes[respondingMach]++;
 346             }
 347         }
 348     } else {
 349         m_hitLatencyHist.sample(cycles);
 350         m_hitTypeLatencyHist[type]->sample(cycles);
 351
 352         if (respondingMach != MachineType_NUM) {
 353             m_hitMachLatencyHist[respondingMach]->sample(cycles);
 354             m_hitTypeMachLatencyHist[type][respondingMach]->sample(cycles);
 355         }
 356     }
 357 }
 358
 359 void
 360 Sequencer::writeCallback(Addr address, DataBlock& data,
 361                          const bool externalHit, const MachineType mach,
 362                          const Cycles initialRequestTime,
 363                          const Cycles forwardRequestTime,
 364                          const Cycles firstResponseTime)
 365 {
 366     assert(address == makeLineAddress(address));
 367     assert(m_writeRequestTable.count(makeLineAddress(address)));
 368
 369     RequestTable::iterator i = m_writeRequestTable.find(address);
 370     assert(i != m_writeRequestTable.end());
 371     SequencerRequest* request = i->second;
 372
 373     m_writeRequestTable.erase(i);
 374     markRemoved();
 375
 376     assert((request->m_type == RubyRequestType_ST) ||
 377            (request->m_type == RubyRequestType_ATOMIC) ||
 378            (request->m_type == RubyRequestType_RMW_Read) ||
 379            (request->m_type == RubyRequestType_RMW_Write) ||
 380            (request->m_type == RubyRequestType_Load_Linked) ||
 381            (request->m_type == RubyRequestType_Store_Conditional) ||
 382            (request->m_type == RubyRequestType_Locked_RMW_Read) ||
 383            (request->m_type == RubyRequestType_Locked_RMW_Write) ||
 384            (request->m_type == RubyRequestType_FLUSH));
 385
 386     //
 387     // For Alpha, properly handle LL, SC, and write requests with respect to
 388     // locked cache blocks.
 389     //
 390     // Not valid for Garnet_standalone protocl
 391     //
 392     bool success = true;
 393     if (!m_runningGarnetStandalone)
 394         success = handleLlsc(address, request);
 395
 396     // Handle SLICC block_on behavior for Locked_RMW accesses. NOTE: the
 397     // address variable here is assumed to be a line address, so when
 398     // blocking buffers, must check line addresses.
 399     if (request->m_type == RubyRequestType_Locked_RMW_Read) {
 400         // blockOnQueue blocks all first-level cache controller queues
 401         // waiting on memory accesses for the specified address that go to
 402         // the specified queue. In this case, a Locked_RMW_Write must go to
 403         // the mandatory_q before unblocking the first-level controller.
 404         // This will block standard loads, stores, ifetches, etc.
 405         m_controller->blockOnQueue(address, m_mandatory_q_ptr);
 406     } else if (request->m_type == RubyRequestType_Locked_RMW_Write) {
 407         m_controller->unblock(address);
 408     }
 409
 410     hitCallback(request, data, success, mach, externalHit,
 411                 initialRequestTime, forwardRequestTime, firstResponseTime);
 412 }
 413
 414 void
 415 Sequencer::readCallback(Addr address, DataBlock& data,
 416                         bool externalHit, const MachineType mach,
 417                         Cycles initialRequestTime,
 418                         Cycles forwardRequestTime,
 419                         Cycles firstResponseTime)
 420 {
 421     assert(address == makeLineAddress(address));
 422     assert(m_readRequestTable.count(makeLineAddress(address)));
 423
 424     RequestTable::iterator i = m_readRequestTable.find(address);
 425     assert(i != m_readRequestTable.end());
 426     SequencerRequest* request = i->second;
 427
 428     m_readRequestTable.erase(i);
 429     markRemoved();
 430
 431     assert((request->m_type == RubyRequestType_LD) ||
 432            (request->m_type == RubyRequestType_IFETCH));
 433
 434     hitCallback(request, data, true, mach, externalHit,
 435                 initialRequestTime, forwardRequestTime, firstResponseTime);
 436 }
 437
 438 void
 439 Sequencer::hitCallback(SequencerRequest* srequest, DataBlock& data,
 440                        bool llscSuccess,
 441                        const MachineType mach, const bool externalHit,
 442                        const Cycles initialRequestTime,
 443                        const Cycles forwardRequestTime,
 444                        const Cycles firstResponseTime)
 445 {
 446     warn_once("Replacement policy updates recently became the responsibility "
 447               "of SLICC state machines. Make sure to setMRU() near callbacks "
 448               "in .sm files!");
 449
 450     PacketPtr pkt = srequest->pkt;
 451     Addr request_address(pkt->getAddr());
 452     RubyRequestType type = srequest->m_type;
 453     Cycles issued_time = srequest->issue_time;
 454
 455     assert(curCycle() >= issued_time);
 456     Cycles total_latency = curCycle() - issued_time;
 457
 458     // Profile the latency for all demand accesses.
 459     recordMissLatency(total_latency, type, mach, externalHit, issued_time,
 460                       initialRequestTime, forwardRequestTime,
 461                       firstResponseTime, curCycle());
 462
 463     DPRINTFR(ProtocolTrace, "%15s %3s %10s%20s %6s>%-6s %#x %d cycles\n",
 464              curTick(), m_version, "Seq",
 465              llscSuccess ? "Done" : "SC_Failed", "", "",
 466              printAddress(request_address), total_latency);
 467
 468     // update the data unless it is a non-data-carrying flush
 469     if (RubySystem::getWarmupEnabled()) {
 470         data.setData(pkt->getConstPtr<uint8_t>(),
 471                      getOffset(request_address), pkt->getSize());
 472     } else if (!pkt->isFlush()) {
 473         if ((type == RubyRequestType_LD) ||
 474             (type == RubyRequestType_IFETCH) ||
 475             (type == RubyRequestType_RMW_Read) ||
 476             (type == RubyRequestType_Locked_RMW_Read) ||
 477             (type == RubyRequestType_Load_Linked)) {
 478             memcpy(pkt->getPtr<uint8_t>(),
 479                    data.getData(getOffset(request_address), pkt->getSize()),
 480                    pkt->getSize());
 481             DPRINTF(RubySequencer, "read data %s\n", data);
 482         } else if (pkt->req->isSwap()) {
 483             std::vector<uint8_t> overwrite_val(pkt->getSize());
 484             memcpy(&overwrite_val[0], pkt->getConstPtr<uint8_t>(),
 485                    pkt->getSize());
 486             memcpy(pkt->getPtr<uint8_t>(),
 487                    data.getData(getOffset(request_address), pkt->getSize()),
 488                    pkt->getSize());
 489             data.setData(&overwrite_val[0],
 490                          getOffset(request_address), pkt->getSize());
 491             DPRINTF(RubySequencer, "swap data %s\n", data);
 492         } else if (type != RubyRequestType_Store_Conditional || llscSuccess) {
 493             // Types of stores set the actual data here, apart from
 494             // failed Store Conditional requests
 495             data.setData(pkt->getConstPtr<uint8_t>(),
 496                          getOffset(request_address), pkt->getSize());
 497             DPRINTF(RubySequencer, "set data %s\n", data);
 498         }
 499     }
 500
 501     // If using the RubyTester, update the RubyTester sender state's
 502     // subBlock with the recieved data.  The tester will later access
 503     // this state.
 504     if (m_usingRubyTester) {
 505         DPRINTF(RubySequencer, "hitCallback %s 0x%x using RubyTester\n",
 506                 pkt->cmdString(), pkt->getAddr());
 507         RubyTester::SenderState* testerSenderState =
 508             pkt->findNextSenderState<RubyTester::SenderState>();
 509         assert(testerSenderState);
 510         testerSenderState->subBlock.mergeFrom(data);
 511     }
 512
 513     delete srequest;
 514
 515     RubySystem *rs = m_ruby_system;
 516     if (RubySystem::getWarmupEnabled()) {
 517         assert(pkt->req);
 518         delete pkt->req;
 519         delete pkt;
 520         rs->m_cache_recorder->enqueueNextFetchRequest();
 521     } else if (RubySystem::getCooldownEnabled()) {
 522         delete pkt;
 523         rs->m_cache_recorder->enqueueNextFlushRequest();
 524     } else {
 525         ruby_hit_callback(pkt);
 526         testDrainComplete();
 527     }
 528 }
 529
 530 bool
 531 Sequencer::empty() const
 532 {
 533     return m_writeRequestTable.empty() && m_readRequestTable.empty();
 534 }
 535
 536 RequestStatus
 537 Sequencer::makeRequest(PacketPtr pkt)
 538 {
 539     if (m_outstanding_count >= m_max_outstanding_requests) {
 540         return RequestStatus_BufferFull;
 541     }
 542
 543     RubyRequestType primary_type = RubyRequestType_NULL;
 544     RubyRequestType secondary_type = RubyRequestType_NULL;
 545
 546     if (pkt->isLLSC()) {
 547         //
 548         // Alpha LL/SC instructions need to be handled carefully by the cache
 549         // coherence protocol to ensure they follow the proper semantics. In
 550         // particular, by identifying the operations as atomic, the protocol
 551         // should understand that migratory sharing optimizations should not
 552         // be performed (i.e. a load between the LL and SC should not steal
 553         // away exclusive permission).
 554         //
 555         if (pkt->isWrite()) {
 556             DPRINTF(RubySequencer, "Issuing SC\n");
 557             primary_type = RubyRequestType_Store_Conditional;
 558         } else {
 559             DPRINTF(RubySequencer, "Issuing LL\n");
 560             assert(pkt->isRead());
 561             primary_type = RubyRequestType_Load_Linked;
 562         }
 563         secondary_type = RubyRequestType_ATOMIC;
 564     } else if (pkt->req->isLockedRMW()) {
 565         //
 566         // x86 locked instructions are translated to store cache coherence
 567         // requests because these requests should always be treated as read
 568         // exclusive operations and should leverage any migratory sharing
 569         // optimization built into the protocol.
 570         //
 571         if (pkt->isWrite()) {
 572             DPRINTF(RubySequencer, "Issuing Locked RMW Write\n");
 573             primary_type = RubyRequestType_Locked_RMW_Write;
 574         } else {
 575             DPRINTF(RubySequencer, "Issuing Locked RMW Read\n");
 576             assert(pkt->isRead());
 577             primary_type = RubyRequestType_Locked_RMW_Read;
 578         }
 579         secondary_type = RubyRequestType_ST;
 580     } else {
 581         //
 582         // To support SwapReq, we need to check isWrite() first: a SwapReq
 583         // should always be treated like a write, but since a SwapReq implies
 584         // both isWrite() and isRead() are true, check isWrite() first here.
 585         //
 586         if (pkt->isWrite()) {
 587             //
 588             // Note: M5 packets do not differentiate ST from RMW_Write
 589             //
 590             primary_type = secondary_type = RubyRequestType_ST;
 591         } else if (pkt->isRead()) {
 592             if (pkt->req->isInstFetch()) {
 593                 primary_type = secondary_type = RubyRequestType_IFETCH;
 594             } else {
 595                 bool storeCheck = false;
 596                 // only X86 need the store check
 597                 if (system->getArch() == Arch::X86ISA) {
 598                     uint32_t flags = pkt->req->getFlags();
 599                     storeCheck = flags &
 600                         (X86ISA::StoreCheck << X86ISA::FlagShift);
 601                 }
 602                 if (storeCheck) {
 603                     primary_type = RubyRequestType_RMW_Read;
 604                     secondary_type = RubyRequestType_ST;
 605                 } else {
 606                     primary_type = secondary_type = RubyRequestType_LD;
 607                 }
 608             }
 609         } else if (pkt->isFlush()) {
 610           primary_type = secondary_type = RubyRequestType_FLUSH;
 611         } else {
 612             panic("Unsupported ruby packet type\n");
 613         }
 614     }
 615
 616     RequestStatus status = insertRequest(pkt, primary_type);
 617     if (status != RequestStatus_Ready)
 618         return status;
 619
 620     issueRequest(pkt, secondary_type);
 621
 622     // TODO: issue hardware prefetches here
 623     return RequestStatus_Issued;
 624 }
 625
 626 void
 627 Sequencer::issueRequest(PacketPtr pkt, RubyRequestType secondary_type)
 628 {
 629     assert(pkt != NULL);
 630     ContextID proc_id = pkt->req->hasContextId() ?
 631         pkt->req->contextId() : InvalidContextID;
 632
 633     ContextID core_id = coreId();
 634
 635     // If valid, copy the pc to the ruby request
 636     Addr pc = 0;
 637     if (pkt->req->hasPC()) {
 638         pc = pkt->req->getPC();
 639     }
 640
 641     // check if the packet has data as for example prefetch and flush
 642     // requests do not
 643     std::shared_ptr<RubyRequest> msg =
 644         std::make_shared<RubyRequest>(clockEdge(), pkt->getAddr(),
 645                                       pkt->isFlush() ?
 646                                       nullptr : pkt->getPtr<uint8_t>(),
 647                                       pkt->getSize(), pc, secondary_type,
 648                                       RubyAccessMode_Supervisor, pkt,
 649                                       PrefetchBit_No, proc_id, core_id);
 650
 651     DPRINTFR(ProtocolTrace, "%15s %3s %10s%20s %6s>%-6s %#x %s\n",
 652             curTick(), m_version, "Seq", "Begin", "", "",
 653             printAddress(msg->getPhysicalAddress()),
 654             RubyRequestType_to_string(secondary_type));
 655
 656     // The Sequencer currently assesses instruction and data cache hit latency
 657     // for the top-level caches at the beginning of a memory access.
 658     // TODO: Eventually, this latency should be moved to represent the actual
 659     // cache access latency portion of the memory access. This will require
 660     // changing cache controller protocol files to assess the latency on the
 661     // access response path.
 662     Cycles latency(0);  // Initialize to zero to catch misconfigured latency
 663     if (secondary_type == RubyRequestType_IFETCH)
 664         latency = m_inst_cache_hit_latency;
 665     else
 666         latency = m_data_cache_hit_latency;
 667
 668     // Send the message to the cache controller
 669     assert(latency > 0);
 670
 671     assert(m_mandatory_q_ptr != NULL);
 672     m_mandatory_q_ptr->enqueue(msg, clockEdge(), cyclesToTicks(latency));
 673 }
 674
 675 template <class KEY, class VALUE>
 676 std::ostream &
 677 operator<<(ostream &out, const std::unordered_map<KEY, VALUE> &map)
 678 {
 679     auto i = map.begin();
 680     auto end = map.end();
 681
 682     out << "[";
 683     for (; i != end; ++i)
 684         out << " " << i->first << "=" << i->second;
 685     out << " ]";
 686
 687     return out;
 688 }
 689
 690 void
 691 Sequencer::print(ostream& out) const
 692 {
 693     out << "[Sequencer: " << m_version
 694         << ", outstanding requests: " << m_outstanding_count
 695         << ", read request table: " << m_readRequestTable
 696         << ", write request table: " << m_writeRequestTable
 697         << "]";
 698 }
 699
 700 // this can be called from setState whenever coherence permissions are
 701 // upgraded when invoked, coherence violations will be checked for the
 702 // given block
 703 void
 704 Sequencer::checkCoherence(Addr addr)
 705 {
 706 #ifdef CHECK_COHERENCE
 707     m_ruby_system->checkGlobalCoherenceInvariant(addr);
 708 #endif
 709 }
 710
 711 void
 712 Sequencer::recordRequestType(SequencerRequestType requestType) {
 713     DPRINTF(RubyStats, "Recorded statistic: %s\n",
 714             SequencerRequestType_to_string(requestType));
 715 }
 716
 717
 718 void
 719 Sequencer::evictionCallback(Addr address)
 720 {
 721     ruby_eviction_callback(address);
 722 }
 723
 724 void
 725 Sequencer::regStats()
 726 {
 727     RubyPort::regStats();
 728
 729     m_store_waiting_on_load
 730         .name(name() + ".store_waiting_on_load")
 731         .desc("Number of times a store aliased with a pending load")
 732         .flags(Stats::nozero);
 733     m_store_waiting_on_store
 734         .name(name() + ".store_waiting_on_store")
 735         .desc("Number of times a store aliased with a pending store")
 736         .flags(Stats::nozero);
 737     m_load_waiting_on_load
 738         .name(name() + ".load_waiting_on_load")
 739         .desc("Number of times a load aliased with a pending load")
 740         .flags(Stats::nozero);
 741     m_load_waiting_on_store
 742         .name(name() + ".load_waiting_on_store")
 743         .desc("Number of times a load aliased with a pending store")
 744         .flags(Stats::nozero);
 745
 746     // These statistical variables are not for display.
 747     // The profiler will collate these across different
 748     // sequencers and display those collated statistics.
 749     m_outstandReqHist.init(10);
 750     m_latencyHist.init(10);
 751     m_hitLatencyHist.init(10);
 752     m_missLatencyHist.init(10);
 753
 754     for (int i = 0; i < RubyRequestType_NUM; i++) {
 755         m_typeLatencyHist.push_back(new Stats::Histogram());
 756         m_typeLatencyHist[i]->init(10);
 757
 758         m_hitTypeLatencyHist.push_back(new Stats::Histogram());
 759         m_hitTypeLatencyHist[i]->init(10);
 760
 761         m_missTypeLatencyHist.push_back(new Stats::Histogram());
 762         m_missTypeLatencyHist[i]->init(10);
 763     }
 764
 765     for (int i = 0; i < MachineType_NUM; i++) {
 766         m_hitMachLatencyHist.push_back(new Stats::Histogram());
 767         m_hitMachLatencyHist[i]->init(10);
 768
 769         m_missMachLatencyHist.push_back(new Stats::Histogram());
 770         m_missMachLatencyHist[i]->init(10);
 771
 772         m_IssueToInitialDelayHist.push_back(new Stats::Histogram());
 773         m_IssueToInitialDelayHist[i]->init(10);
 774
 775         m_InitialToForwardDelayHist.push_back(new Stats::Histogram());
 776         m_InitialToForwardDelayHist[i]->init(10);
 777
 778         m_ForwardToFirstResponseDelayHist.push_back(new Stats::Histogram());
 779         m_ForwardToFirstResponseDelayHist[i]->init(10);
 780
 781         m_FirstResponseToCompletionDelayHist.push_back(new Stats::Histogram());
 782         m_FirstResponseToCompletionDelayHist[i]->init(10);
 783     }
 784
 785     for (int i = 0; i < RubyRequestType_NUM; i++) {
 786         m_hitTypeMachLatencyHist.push_back(std::vector<Stats::Histogram *>());
 787         m_missTypeMachLatencyHist.push_back(std::vector<Stats::Histogram *>());
 788
 789         for (int j = 0; j < MachineType_NUM; j++) {
 790             m_hitTypeMachLatencyHist[i].push_back(new Stats::Histogram());
 791             m_hitTypeMachLatencyHist[i][j]->init(10);
 792
 793             m_missTypeMachLatencyHist[i].push_back(new Stats::Histogram());
 794             m_missTypeMachLatencyHist[i][j]->init(10);
 795         }
 796     }
 797 }