src/mem/cache/base.hh

   1 /*
   2  * Copyright (c) 2003-2005 The Regents of The University of Michigan
   3  * All rights reserved.
   4  *
   5  * Redistribution and use in source and binary forms, with or without
   6  * modification, are permitted provided that the following conditions are
   7  * met: redistributions of source code must retain the above copyright
   8  * notice, this list of conditions and the following disclaimer;
   9  * redistributions in binary form must reproduce the above copyright
  10  * notice, this list of conditions and the following disclaimer in the
  11  * documentation and/or other materials provided with the distribution;
  12  * neither the name of the copyright holders nor the names of its
  13  * contributors may be used to endorse or promote products derived from
  14  * this software without specific prior written permission.
  15  *
  16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  17  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  18  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  19  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  20  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  21  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  22  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  26  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  27  *
  28  * Authors: Erik Hallnor
  29  *          Steve Reinhardt
  30  *          Ron Dreslinski
  31  */
  32
  33 /**
  34  * @file
  35  * Declares a basic cache interface BaseCache.
  36  */
  37
  38 #ifndef __BASE_CACHE_HH__
  39 #define __BASE_CACHE_HH__
  40
  41 #include <algorithm>
  42 #include <list>
  43 #include <string>
  44 #include <vector>
  45
  46 #include "base/misc.hh"
  47 #include "base/statistics.hh"
  48 #include "base/trace.hh"
  49 #include "base/types.hh"
  50 #include "debug/Cache.hh"
  51 #include "debug/CachePort.hh"
  52 #include "mem/cache/mshr_queue.hh"
  53 #include "mem/mem_object.hh"
  54 #include "mem/packet.hh"
  55 #include "mem/request.hh"
  56 #include "mem/tport.hh"
  57 #include "params/BaseCache.hh"
  58 #include "sim/eventq.hh"
  59 #include "sim/full_system.hh"
  60 #include "sim/sim_exit.hh"
  61
  62 class MSHR;
  63 /**
  64  * A basic cache interface. Implements some common functions for speed.
  65  */
  66 class BaseCache : public MemObject
  67 {
  68     /**
  69      * Indexes to enumerate the MSHR queues.
  70      */
  71     enum MSHRQueueIndex {
  72         MSHRQueue_MSHRs,
  73         MSHRQueue_WriteBuffer
  74     };
  75
  76     /**
  77      * Reasons for caches to be blocked.
  78      */
  79     enum BlockedCause {
  80         Blocked_NoMSHRs = MSHRQueue_MSHRs,
  81         Blocked_NoWBBuffers = MSHRQueue_WriteBuffer,
  82         Blocked_NoTargets,
  83         NUM_BLOCKED_CAUSES
  84     };
  85
  86   public:
  87     /**
  88      * Reasons for cache to request a bus.
  89      */
  90     enum RequestCause {
  91         Request_MSHR = MSHRQueue_MSHRs,
  92         Request_WB = MSHRQueue_WriteBuffer,
  93         Request_PF,
  94         NUM_REQUEST_CAUSES
  95     };
  96
  97   private:
  98
  99     class CachePort : public SimpleTimingPort
 100     {
 101       public:
 102         BaseCache *cache;
 103
 104       protected:
 105         CachePort(const std::string &_name, BaseCache *_cache,
 106                   const std::string &_label);
 107
 108         virtual void recvStatusChange(Status status);
 109
 110         virtual unsigned deviceBlockSize() const;
 111
 112         bool recvRetryCommon();
 113
 114         typedef EventWrapper<Port, &Port::sendRetry>
 115             SendRetryEvent;
 116
 117         const std::string label;
 118
 119       public:
 120         void setOtherPort(CachePort *_otherPort) { otherPort = _otherPort; }
 121
 122         void setBlocked();
 123
 124         void clearBlocked();
 125
 126         bool checkFunctional(PacketPtr pkt);
 127
 128         CachePort *otherPort;
 129
 130         bool blocked;
 131
 132         bool mustSendRetry;
 133
 134         void requestBus(RequestCause cause, Tick time)
 135         {
 136             DPRINTF(CachePort, "Asserting bus request for cause %d\n", cause);
 137             if (!waitingOnRetry) {
 138                 schedSendEvent(time);
 139             }
 140         }
 141
 142         void respond(PacketPtr pkt, Tick time) {
 143             schedSendTiming(pkt, time);
 144         }
 145     };
 146
 147   public: //Made public so coherence can get at it.
 148     CachePort *cpuSidePort;
 149     CachePort *memSidePort;
 150
 151   protected:
 152
 153     /** Miss status registers */
 154     MSHRQueue mshrQueue;
 155
 156     /** Write/writeback buffer */
 157     MSHRQueue writeBuffer;
 158
 159     MSHR *allocateBufferInternal(MSHRQueue *mq, Addr addr, int size,
 160                                  PacketPtr pkt, Tick time, bool requestBus)
 161     {
 162         MSHR *mshr = mq->allocate(addr, size, pkt, time, order++);
 163
 164         if (mq->isFull()) {
 165             setBlocked((BlockedCause)mq->index);
 166         }
 167
 168         if (requestBus) {
 169             requestMemSideBus((RequestCause)mq->index, time);
 170         }
 171
 172         return mshr;
 173     }
 174
 175     void markInServiceInternal(MSHR *mshr, PacketPtr pkt)
 176     {
 177         MSHRQueue *mq = mshr->queue;
 178         bool wasFull = mq->isFull();
 179         mq->markInService(mshr, pkt);
 180         if (wasFull && !mq->isFull()) {
 181             clearBlocked((BlockedCause)mq->index);
 182         }
 183     }
 184
 185     /** Block size of this cache */
 186     const unsigned blkSize;
 187
 188     /**
 189      * The latency of a hit in this device.
 190      */
 191     int hitLatency;
 192
 193     /** The number of targets for each MSHR. */
 194     const int numTarget;
 195
 196     /** Do we forward snoops from mem side port through to cpu side port? */
 197     bool forwardSnoops;
 198
 199     /** Is this cache a toplevel cache (e.g. L1, I/O cache). If so we should
 200      * never try to forward ownership and similar optimizations to the cpu
 201      * side */
 202     bool isTopLevel;
 203
 204     /**
 205      * Bit vector of the blocking reasons for the access path.
 206      * @sa #BlockedCause
 207      */
 208     uint8_t blocked;
 209
 210     /** Increasing order number assigned to each incoming request. */
 211     uint64_t order;
 212
 213     /** Stores time the cache blocked for statistics. */
 214     Tick blockedCycle;
 215
 216     /** Pointer to the MSHR that has no targets. */
 217     MSHR *noTargetMSHR;
 218
 219     /** The number of misses to trigger an exit event. */
 220     Counter missCount;
 221
 222     /** The drain event. */
 223     Event *drainEvent;
 224
 225     /**
 226      * The address range to which the cache responds on the CPU side.
 227      * Normally this is all possible memory addresses. */
 228     Range<Addr> addrRange;
 229
 230     /** number of cpus sharing this cache - from config file */
 231     int _numCpus;
 232
 233   public:
 234     int numCpus() { return _numCpus; }
 235     // Statistics
 236     /**
 237      * @addtogroup CacheStatistics
 238      * @{
 239      */
 240
 241     /** Number of hits per thread for each type of command. @sa Packet::Command */
 242     Stats::Vector hits[MemCmd::NUM_MEM_CMDS];
 243     /** Number of hits for demand accesses. */
 244     Stats::Formula demandHits;
 245     /** Number of hit for all accesses. */
 246     Stats::Formula overallHits;
 247
 248     /** Number of misses per thread for each type of command. @sa Packet::Command */
 249     Stats::Vector misses[MemCmd::NUM_MEM_CMDS];
 250     /** Number of misses for demand accesses. */
 251     Stats::Formula demandMisses;
 252     /** Number of misses for all accesses. */
 253     Stats::Formula overallMisses;
 254
 255     /**
 256      * Total number of cycles per thread/command spent waiting for a miss.
 257      * Used to calculate the average miss latency.
 258      */
 259     Stats::Vector missLatency[MemCmd::NUM_MEM_CMDS];
 260     /** Total number of cycles spent waiting for demand misses. */
 261     Stats::Formula demandMissLatency;
 262     /** Total number of cycles spent waiting for all misses. */
 263     Stats::Formula overallMissLatency;
 264
 265     /** The number of accesses per command and thread. */
 266     Stats::Formula accesses[MemCmd::NUM_MEM_CMDS];
 267     /** The number of demand accesses. */
 268     Stats::Formula demandAccesses;
 269     /** The number of overall accesses. */
 270     Stats::Formula overallAccesses;
 271
 272     /** The miss rate per command and thread. */
 273     Stats::Formula missRate[MemCmd::NUM_MEM_CMDS];
 274     /** The miss rate of all demand accesses. */
 275     Stats::Formula demandMissRate;
 276     /** The miss rate for all accesses. */
 277     Stats::Formula overallMissRate;
 278
 279     /** The average miss latency per command and thread. */
 280     Stats::Formula avgMissLatency[MemCmd::NUM_MEM_CMDS];
 281     /** The average miss latency for demand misses. */
 282     Stats::Formula demandAvgMissLatency;
 283     /** The average miss latency for all misses. */
 284     Stats::Formula overallAvgMissLatency;
 285
 286     /** The total number of cycles blocked for each blocked cause. */
 287     Stats::Vector blocked_cycles;
 288     /** The number of times this cache blocked for each blocked cause. */
 289     Stats::Vector blocked_causes;
 290
 291     /** The average number of cycles blocked for each blocked cause. */
 292     Stats::Formula avg_blocked;
 293
 294     /** The number of fast writes (WH64) performed. */
 295     Stats::Scalar fastWrites;
 296
 297     /** The number of cache copies performed. */
 298     Stats::Scalar cacheCopies;
 299
 300     /** Number of blocks written back per thread. */
 301     Stats::Vector writebacks;
 302
 303     /** Number of misses that hit in the MSHRs per command and thread. */
 304     Stats::Vector mshr_hits[MemCmd::NUM_MEM_CMDS];
 305     /** Demand misses that hit in the MSHRs. */
 306     Stats::Formula demandMshrHits;
 307     /** Total number of misses that hit in the MSHRs. */
 308     Stats::Formula overallMshrHits;
 309
 310     /** Number of misses that miss in the MSHRs, per command and thread. */
 311     Stats::Vector mshr_misses[MemCmd::NUM_MEM_CMDS];
 312     /** Demand misses that miss in the MSHRs. */
 313     Stats::Formula demandMshrMisses;
 314     /** Total number of misses that miss in the MSHRs. */
 315     Stats::Formula overallMshrMisses;
 316
 317     /** Number of misses that miss in the MSHRs, per command and thread. */
 318     Stats::Vector mshr_uncacheable[MemCmd::NUM_MEM_CMDS];
 319     /** Total number of misses that miss in the MSHRs. */
 320     Stats::Formula overallMshrUncacheable;
 321
 322     /** Total cycle latency of each MSHR miss, per command and thread. */
 323     Stats::Vector mshr_miss_latency[MemCmd::NUM_MEM_CMDS];
 324     /** Total cycle latency of demand MSHR misses. */
 325     Stats::Formula demandMshrMissLatency;
 326     /** Total cycle latency of overall MSHR misses. */
 327     Stats::Formula overallMshrMissLatency;
 328
 329     /** Total cycle latency of each MSHR miss, per command and thread. */
 330     Stats::Vector mshr_uncacheable_lat[MemCmd::NUM_MEM_CMDS];
 331     /** Total cycle latency of overall MSHR misses. */
 332     Stats::Formula overallMshrUncacheableLatency;
 333
 334 #if 0
 335     /** The total number of MSHR accesses per command and thread. */
 336     Stats::Formula mshrAccesses[MemCmd::NUM_MEM_CMDS];
 337     /** The total number of demand MSHR accesses. */
 338     Stats::Formula demandMshrAccesses;
 339     /** The total number of MSHR accesses. */
 340     Stats::Formula overallMshrAccesses;
 341 #endif
 342
 343     /** The miss rate in the MSHRs pre command and thread. */
 344     Stats::Formula mshrMissRate[MemCmd::NUM_MEM_CMDS];
 345     /** The demand miss rate in the MSHRs. */
 346     Stats::Formula demandMshrMissRate;
 347     /** The overall miss rate in the MSHRs. */
 348     Stats::Formula overallMshrMissRate;
 349
 350     /** The average latency of an MSHR miss, per command and thread. */
 351     Stats::Formula avgMshrMissLatency[MemCmd::NUM_MEM_CMDS];
 352     /** The average latency of a demand MSHR miss. */
 353     Stats::Formula demandAvgMshrMissLatency;
 354     /** The average overall latency of an MSHR miss. */
 355     Stats::Formula overallAvgMshrMissLatency;
 356
 357     /** The average latency of an MSHR miss, per command and thread. */
 358     Stats::Formula avgMshrUncacheableLatency[MemCmd::NUM_MEM_CMDS];
 359     /** The average overall latency of an MSHR miss. */
 360     Stats::Formula overallAvgMshrUncacheableLatency;
 361
 362     /** The number of times a thread hit its MSHR cap. */
 363     Stats::Vector mshr_cap_events;
 364     /** The number of times software prefetches caused the MSHR to block. */
 365     Stats::Vector soft_prefetch_mshr_full;
 366
 367     Stats::Scalar mshr_no_allocate_misses;
 368
 369     /**
 370      * @}
 371      */
 372
 373     /**
 374      * Register stats for this object.
 375      */
 376     virtual void regStats();
 377
 378   public:
 379     typedef BaseCacheParams Params;
 380     BaseCache(const Params *p);
 381     ~BaseCache() {}
 382
 383     virtual void init();
 384
 385     /**
 386      * Query block size of a cache.
 387      * @return  The block size
 388      */
 389     unsigned
 390     getBlockSize() const
 391     {
 392         return blkSize;
 393     }
 394
 395
 396     Addr blockAlign(Addr addr) const { return (addr & ~(Addr(blkSize - 1))); }
 397
 398
 399     const Range<Addr> &getAddrRange() const { return addrRange; }
 400
 401     MSHR *allocateMissBuffer(PacketPtr pkt, Tick time, bool requestBus)
 402     {
 403         assert(!pkt->req->isUncacheable());
 404         return allocateBufferInternal(&mshrQueue,
 405                                       blockAlign(pkt->getAddr()), blkSize,
 406                                       pkt, time, requestBus);
 407     }
 408
 409     MSHR *allocateWriteBuffer(PacketPtr pkt, Tick time, bool requestBus)
 410     {
 411         assert(pkt->isWrite() && !pkt->isRead());
 412         return allocateBufferInternal(&writeBuffer,
 413                                       pkt->getAddr(), pkt->getSize(),
 414                                       pkt, time, requestBus);
 415     }
 416
 417     MSHR *allocateUncachedReadBuffer(PacketPtr pkt, Tick time, bool requestBus)
 418     {
 419         assert(pkt->req->isUncacheable());
 420         assert(pkt->isRead());
 421         return allocateBufferInternal(&mshrQueue,
 422                                       pkt->getAddr(), pkt->getSize(),
 423                                       pkt, time, requestBus);
 424     }
 425
 426     /**
 427      * Returns true if the cache is blocked for accesses.
 428      */
 429     bool isBlocked()
 430     {
 431         return blocked != 0;
 432     }
 433
 434     /**
 435      * Marks the access path of the cache as blocked for the given cause. This
 436      * also sets the blocked flag in the slave interface.
 437      * @param cause The reason for the cache blocking.
 438      */
 439     void setBlocked(BlockedCause cause)
 440     {
 441         uint8_t flag = 1 << cause;
 442         if (blocked == 0) {
 443             blocked_causes[cause]++;
 444             blockedCycle = curTick();
 445             cpuSidePort->setBlocked();
 446         }
 447         blocked |= flag;
 448         DPRINTF(Cache,"Blocking for cause %d, mask=%d\n", cause, blocked);
 449     }
 450
 451     /**
 452      * Marks the cache as unblocked for the given cause. This also clears the
 453      * blocked flags in the appropriate interfaces.
 454      * @param cause The newly unblocked cause.
 455      * @warning Calling this function can cause a blocked request on the bus to
 456      * access the cache. The cache must be in a state to handle that request.
 457      */
 458     void clearBlocked(BlockedCause cause)
 459     {
 460         uint8_t flag = 1 << cause;
 461         blocked &= ~flag;
 462         DPRINTF(Cache,"Unblocking for cause %d, mask=%d\n", cause, blocked);
 463         if (blocked == 0) {
 464             blocked_cycles[cause] += curTick() - blockedCycle;
 465             cpuSidePort->clearBlocked();
 466         }
 467     }
 468
 469     /**
 470      * Request the master bus for the given cause and time.
 471      * @param cause The reason for the request.
 472      * @param time The time to make the request.
 473      */
 474     void requestMemSideBus(RequestCause cause, Tick time)
 475     {
 476         memSidePort->requestBus(cause, time);
 477     }
 478
 479     /**
 480      * Clear the master bus request for the given cause.
 481      * @param cause The request reason to clear.
 482      */
 483     void deassertMemSideBusRequest(RequestCause cause)
 484     {
 485         // Obsolete... we no longer signal bus requests explicitly so
 486         // we can't deassert them.  Leaving this in as a no-op since
 487         // the prefetcher calls it to indicate that it no longer wants
 488         // to request a prefetch, and someday that might be
 489         // interesting again.
 490     }
 491
 492     virtual unsigned int drain(Event *de);
 493
 494     virtual bool inCache(Addr addr) = 0;
 495
 496     virtual bool inMissQueue(Addr addr) = 0;
 497
 498     void incMissCount(PacketPtr pkt, int id)
 499     {
 500
 501         if (pkt->cmd == MemCmd::Writeback) {
 502             assert(id == -1);
 503             misses[pkt->cmdToIndex()][0]++;
 504             /* same thing for writeback hits as misses - no context id
 505              * available, meanwhile writeback hit/miss stats are not used
 506              * in any aggregate hit/miss calculations, so just lump them all
 507              * in bucket 0 */
 508         } else if (FullSystem && id == -1) {
 509             // Device accesses have id -1
 510             // lump device accesses into their own bucket
 511             misses[pkt->cmdToIndex()][_numCpus]++;
 512         } else {
 513             misses[pkt->cmdToIndex()][id % _numCpus]++;
 514         }
 515
 516         if (missCount) {
 517             --missCount;
 518             if (missCount == 0)
 519                 exitSimLoop("A cache reached the maximum miss count");
 520         }
 521     }
 522     void incHitCount(PacketPtr pkt, int id)
 523     {
 524
 525         /* Writeback requests don't have a context id associated with
 526          * them, so attributing a hit to a -1 context id is obviously a
 527          * problem.  I've noticed in the stats that hits are split into
 528          * demand and non-demand hits - neither of which include writeback
 529          * hits, so here, I'll just put the writeback hits into bucket 0
 530          * since it won't mess with any other stats -hsul */
 531         if (pkt->cmd == MemCmd::Writeback) {
 532             assert(id == -1);
 533             hits[pkt->cmdToIndex()][0]++;
 534         } else if (FullSystem && id == -1) {
 535             // Device accesses have id -1
 536             // lump device accesses into their own bucket
 537             hits[pkt->cmdToIndex()][_numCpus]++;
 538         } else {
 539             /* the % is necessary in case there are switch cpus */
 540             hits[pkt->cmdToIndex()][id % _numCpus]++;
 541         }
 542     }
 543
 544 };
 545
 546 #endif //__BASE_CACHE_HH__