src/mem/dram_ctrl.hh

   1 /*
   2  * Copyright (c) 2012-2016 ARM Limited
   3  * All rights reserved
   4  *
   5  * The license below extends only to copyright in the software and shall
   6  * not be construed as granting a license to any other intellectual
   7  * property including but not limited to intellectual property relating
   8  * to a hardware implementation of the functionality of the software
   9  * licensed hereunder.  You may use the software subject to the license
  10  * terms below provided that you ensure that this notice is replicated
  11  * unmodified and in its entirety in all distributions of the software,
  12  * modified or unmodified, in source code or in binary form.
  13  *
  14  * Copyright (c) 2013 Amin Farmahini-Farahani
  15  * All rights reserved.
  16  *
  17  * Redistribution and use in source and binary forms, with or without
  18  * modification, are permitted provided that the following conditions are
  19  * met: redistributions of source code must retain the above copyright
  20  * notice, this list of conditions and the following disclaimer;
  21  * redistributions in binary form must reproduce the above copyright
  22  * notice, this list of conditions and the following disclaimer in the
  23  * documentation and/or other materials provided with the distribution;
  24  * neither the name of the copyright holders nor the names of its
  25  * contributors may be used to endorse or promote products derived from
  26  * this software without specific prior written permission.
  27  *
  28  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  29  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  30  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  31  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  32  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  33  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  34  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  35  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  36  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  37  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  38  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  39  *
  40  * Authors: Andreas Hansson
  41  *          Ani Udipi
  42  *          Neha Agarwal
  43  *          Omar Naji
  44  *          Matthias Jung
  45  *          Wendy Elsasser
  46  */
  47
  48 /**
  49  * @file
  50  * DRAMCtrl declaration
  51  */
  52
  53 #ifndef __MEM_DRAM_CTRL_HH__
  54 #define __MEM_DRAM_CTRL_HH__
  55
  56 #include <deque>
  57 #include <string>
  58 #include <unordered_set>
  59
  60 #include "base/callback.hh"
  61 #include "base/statistics.hh"
  62 #include "enums/AddrMap.hh"
  63 #include "enums/MemSched.hh"
  64 #include "enums/PageManage.hh"
  65 #include "mem/abstract_mem.hh"
  66 #include "mem/qport.hh"
  67 #include "params/DRAMCtrl.hh"
  68 #include "sim/eventq.hh"
  69 #include "mem/drampower.hh"
  70
  71 /**
  72  * The DRAM controller is a single-channel memory controller capturing
  73  * the most important timing constraints associated with a
  74  * contemporary DRAM. For multi-channel memory systems, the controller
  75  * is combined with a crossbar model, with the channel address
  76  * interleaving taking part in the crossbar.
  77  *
  78  * As a basic design principle, this controller
  79  * model is not cycle callable, but instead uses events to: 1) decide
  80  * when new decisions can be made, 2) when resources become available,
  81  * 3) when things are to be considered done, and 4) when to send
  82  * things back. Through these simple principles, the model delivers
  83  * high performance, and lots of flexibility, allowing users to
  84  * evaluate the system impact of a wide range of memory technologies,
  85  * such as DDR3/4, LPDDR2/3/4, WideIO1/2, HBM and HMC.
  86  *
  87  * For more details, please see Hansson et al, "Simulating DRAM
  88  * controllers for future system architecture exploration",
  89  * Proc. ISPASS, 2014. If you use this model as part of your research
  90  * please cite the paper.
  91  *
  92  * The low-power functionality implements a staggered powerdown
  93  * similar to that described in "Optimized Active and Power-Down Mode
  94  * Refresh Control in 3D-DRAMs" by Jung et al, VLSI-SoC, 2014.
  95  */
  96 class DRAMCtrl : public AbstractMemory
  97 {
  98
  99   private:
 100
 101     // For now, make use of a queued slave port to avoid dealing with
 102     // flow control for the responses being sent back
 103     class MemoryPort : public QueuedSlavePort
 104     {
 105
 106         RespPacketQueue queue;
 107         DRAMCtrl& memory;
 108
 109       public:
 110
 111         MemoryPort(const std::string& name, DRAMCtrl& _memory);
 112
 113       protected:
 114
 115         Tick recvAtomic(PacketPtr pkt);
 116
 117         void recvFunctional(PacketPtr pkt);
 118
 119         bool recvTimingReq(PacketPtr);
 120
 121         virtual AddrRangeList getAddrRanges() const;
 122
 123     };
 124
 125     /**
 126      * Our incoming port, for a multi-ported controller add a crossbar
 127      * in front of it
 128      */
 129     MemoryPort port;
 130
 131     /**
 132      * Remeber if the memory system is in timing mode
 133      */
 134     bool isTimingMode;
 135
 136     /**
 137      * Remember if we have to retry a request when available.
 138      */
 139     bool retryRdReq;
 140     bool retryWrReq;
 141
 142     /**
 143      * Bus state used to control the read/write switching and drive
 144      * the scheduling of the next request.
 145      */
 146     enum BusState {
 147         READ = 0,
 148         WRITE,
 149     };
 150
 151     BusState busState;
 152
 153     /* bus state for next request event triggered */
 154     BusState busStateNext;
 155
 156     /**
 157      * Simple structure to hold the values needed to keep track of
 158      * commands for DRAMPower
 159      */
 160     struct Command {
 161        Data::MemCommand::cmds type;
 162        uint8_t bank;
 163        Tick timeStamp;
 164
 165        constexpr Command(Data::MemCommand::cmds _type, uint8_t _bank,
 166                          Tick time_stamp)
 167             : type(_type), bank(_bank), timeStamp(time_stamp)
 168         { }
 169     };
 170
 171     /**
 172      * A basic class to track the bank state, i.e. what row is
 173      * currently open (if any), when is the bank free to accept a new
 174      * column (read/write) command, when can it be precharged, and
 175      * when can it be activated.
 176      *
 177      * The bank also keeps track of how many bytes have been accessed
 178      * in the open row since it was opened.
 179      */
 180     class Bank
 181     {
 182
 183       public:
 184
 185         static const uint32_t NO_ROW = -1;
 186
 187         uint32_t openRow;
 188         uint8_t bank;
 189         uint8_t bankgr;
 190
 191         Tick colAllowedAt;
 192         Tick preAllowedAt;
 193         Tick actAllowedAt;
 194
 195         uint32_t rowAccesses;
 196         uint32_t bytesAccessed;
 197
 198         Bank() :
 199             openRow(NO_ROW), bank(0), bankgr(0),
 200             colAllowedAt(0), preAllowedAt(0), actAllowedAt(0),
 201             rowAccesses(0), bytesAccessed(0)
 202         { }
 203     };
 204
 205
 206     /**
 207      * The power state captures the different operational states of
 208      * the DRAM and interacts with the bus read/write state machine,
 209      * and the refresh state machine.
 210      *
 211      * PWR_IDLE      : The idle state in which all banks are closed
 212      *                 From here can transition to:  PWR_REF, PWR_ACT,
 213      *                 PWR_PRE_PDN
 214      *
 215      * PWR_REF       : Auto-refresh state.  Will transition when refresh is
 216      *                 complete based on power state prior to PWR_REF
 217      *                 From here can transition to:  PWR_IDLE, PWR_PRE_PDN,
 218      *                 PWR_SREF
 219      *
 220      * PWR_SREF      : Self-refresh state.  Entered after refresh if
 221      *                 previous state was PWR_PRE_PDN
 222      *                 From here can transition to:  PWR_IDLE
 223      *
 224      * PWR_PRE_PDN   : Precharge power down state
 225      *                 From here can transition to:  PWR_REF, PWR_IDLE
 226      *
 227      * PWR_ACT       : Activate state in which one or more banks are open
 228      *                 From here can transition to:  PWR_IDLE, PWR_ACT_PDN
 229      *
 230      * PWR_ACT_PDN   : Activate power down state
 231      *                 From here can transition to:  PWR_ACT
 232      */
 233      enum PowerState {
 234          PWR_IDLE = 0,
 235          PWR_REF,
 236          PWR_SREF,
 237          PWR_PRE_PDN,
 238          PWR_ACT,
 239          PWR_ACT_PDN
 240      };
 241
 242     /**
 243      * The refresh state is used to control the progress of the
 244      * refresh scheduling. When normal operation is in progress the
 245      * refresh state is idle. Once tREFI has elasped, a refresh event
 246      * is triggered to start the following STM transitions which are
 247      * used to issue a refresh and return back to normal operation
 248      *
 249      * REF_IDLE      : IDLE state used during normal operation
 250      *                 From here can transition to:  REF_DRAIN
 251      *
 252      * REF_SREF_EXIT : Exiting a self-refresh; refresh event scheduled
 253      *                 after self-refresh exit completes
 254      *                 From here can transition to:  REF_DRAIN
 255      *
 256      * REF_DRAIN     : Drain state in which on going accesses complete.
 257      *                 From here can transition to:  REF_PD_EXIT
 258      *
 259      * REF_PD_EXIT   : Evaluate pwrState and issue wakeup if needed
 260      *                 Next state dependent on whether banks are open
 261      *                 From here can transition to:  REF_PRE, REF_START
 262      *
 263      * REF_PRE       : Close (precharge) all open banks
 264      *                 From here can transition to:  REF_START
 265      *
 266      * REF_START     : Issue refresh command and update DRAMPower stats
 267      *                 From here can transition to:  REF_RUN
 268      *
 269      * REF_RUN       : Refresh running, waiting for tRFC to expire
 270      *                 From here can transition to:  REF_IDLE, REF_SREF_EXIT
 271      */
 272      enum RefreshState {
 273          REF_IDLE = 0,
 274          REF_DRAIN,
 275          REF_PD_EXIT,
 276          REF_SREF_EXIT,
 277          REF_PRE,
 278          REF_START,
 279          REF_RUN
 280      };
 281
 282     /**
 283      * Rank class includes a vector of banks. Refresh and Power state
 284      * machines are defined per rank. Events required to change the
 285      * state of the refresh and power state machine are scheduled per
 286      * rank. This class allows the implementation of rank-wise refresh
 287      * and rank-wise power-down.
 288      */
 289     class Rank : public EventManager
 290     {
 291
 292       private:
 293
 294         /**
 295          * A reference to the parent DRAMCtrl instance
 296          */
 297         DRAMCtrl& memory;
 298
 299         /**
 300          * Since we are taking decisions out of order, we need to keep
 301          * track of what power transition is happening at what time
 302          */
 303         PowerState pwrStateTrans;
 304
 305         /**
 306          * Previous low-power state, which will be re-entered after refresh.
 307          */
 308         PowerState pwrStatePostRefresh;
 309
 310         /**
 311          * Track when we transitioned to the current power state
 312          */
 313         Tick pwrStateTick;
 314
 315         /**
 316          * Keep track of when a refresh is due.
 317          */
 318         Tick refreshDueAt;
 319
 320         /*
 321          * Command energies
 322          */
 323         Stats::Scalar actEnergy;
 324         Stats::Scalar preEnergy;
 325         Stats::Scalar readEnergy;
 326         Stats::Scalar writeEnergy;
 327         Stats::Scalar refreshEnergy;
 328
 329         /*
 330          * Active Background Energy
 331          */
 332         Stats::Scalar actBackEnergy;
 333
 334         /*
 335          * Precharge Background Energy
 336          */
 337         Stats::Scalar preBackEnergy;
 338
 339         /*
 340          * Active Power-Down Energy
 341          */
 342         Stats::Scalar actPowerDownEnergy;
 343
 344         /*
 345          * Precharge Power-Down Energy
 346          */
 347         Stats::Scalar prePowerDownEnergy;
 348
 349         /*
 350          * self Refresh Energy
 351          */
 352         Stats::Scalar selfRefreshEnergy;
 353
 354         Stats::Scalar totalEnergy;
 355         Stats::Scalar averagePower;
 356
 357         /**
 358          * Stat to track total DRAM idle time
 359          *
 360          */
 361         Stats::Scalar totalIdleTime;
 362
 363         /**
 364          * Track time spent in each power state.
 365          */
 366         Stats::Vector pwrStateTime;
 367
 368         /**
 369          * Function to update Power Stats
 370          */
 371         void updatePowerStats();
 372
 373         /**
 374          * Schedule a power state transition in the future, and
 375          * potentially override an already scheduled transition.
 376          *
 377          * @param pwr_state Power state to transition to
 378          * @param tick Tick when transition should take place
 379          */
 380         void schedulePowerEvent(PowerState pwr_state, Tick tick);
 381
 382       public:
 383
 384         /**
 385          * Current power state.
 386          */
 387         PowerState pwrState;
 388
 389        /**
 390          * current refresh state
 391          */
 392         RefreshState refreshState;
 393
 394         /**
 395          * rank is in or transitioning to power-down or self-refresh
 396          */
 397         bool inLowPowerState;
 398
 399         /**
 400          * Current Rank index
 401          */
 402         uint8_t rank;
 403
 404        /**
 405          * Track number of packets in read queue going to this rank
 406          */
 407         uint32_t readEntries;
 408
 409        /**
 410          * Track number of packets in write queue going to this rank
 411          */
 412         uint32_t writeEntries;
 413
 414         /**
 415          * Number of ACT, RD, and WR events currently scheduled
 416          * Incremented when a refresh event is started as well
 417          * Used to determine when a low-power state can be entered
 418          */
 419         uint8_t outstandingEvents;
 420
 421         /**
 422          * delay power-down and self-refresh exit until this requirement is met
 423          */
 424         Tick wakeUpAllowedAt;
 425
 426         /**
 427          * One DRAMPower instance per rank
 428          */
 429         DRAMPower power;
 430
 431         /**
 432          * List of comamnds issued, to be sent to DRAMPpower at refresh
 433          * and stats dump.  Keep commands here since commands to different
 434          * banks are added out of order.  Will only pass commands up to
 435          * curTick() to DRAMPower after sorting.
 436          */
 437         std::vector<Command> cmdList;
 438
 439         /**
 440          * Vector of Banks. Each rank is made of several devices which in
 441          * term are made from several banks.
 442          */
 443         std::vector<Bank> banks;
 444
 445         /**
 446          *  To track number of banks which are currently active for
 447          *  this rank.
 448          */
 449         unsigned int numBanksActive;
 450
 451         /** List to keep track of activate ticks */
 452         std::deque<Tick> actTicks;
 453
 454         Rank(DRAMCtrl& _memory, const DRAMCtrlParams* _p, int rank);
 455
 456         const std::string name() const
 457         {
 458             return csprintf("%s_%d", memory.name(), rank);
 459         }
 460
 461         /**
 462          * Kick off accounting for power and refresh states and
 463          * schedule initial refresh.
 464          *
 465          * @param ref_tick Tick for first refresh
 466          */
 467         void startup(Tick ref_tick);
 468
 469         /**
 470          * Stop the refresh events.
 471          */
 472         void suspend();
 473
 474         /**
 475          * Check if the current rank is available for scheduling.
 476          * Rank will be unavailable if refresh is ongoing.
 477          * This includes refresh events explicitly scheduled from the the
 478          * controller or memory initiated events which will occur during
 479          * self-refresh mode.
 480          *
 481          * @param Return true if the rank is idle from a refresh point of view
 482          */
 483         bool isAvailable() const { return refreshState == REF_IDLE; }
 484
 485         /**
 486          * Check if the current rank has all banks closed and is not
 487          * in a low power state
 488          *
 489          * @param Return true if the rank is idle from a bank
 490          *        and power point of view
 491          */
 492         bool inPwrIdleState() const { return pwrState == PWR_IDLE; }
 493
 494         /**
 495          * Trigger a self-refresh exit if there are entries enqueued
 496          * Exit if there are any read entries regardless of the bus state.
 497          * If we are currently issuing write commands, exit if we have any
 498          * write commands enqueued as well.
 499          * Could expand this in the future to analyze state of entire queue
 500          * if needed.
 501          *
 502          * @return boolean indicating self-refresh exit should be scheduled
 503          */
 504         bool forceSelfRefreshExit() const {
 505             return (readEntries != 0) ||
 506                    ((memory.busStateNext == WRITE) && (writeEntries != 0));
 507         }
 508
 509         /**
 510          * Check if the current rank is idle and should enter a low-pwer state
 511          *
 512          * @param Return true if the there are no read commands in Q
 513          *                    and there are no outstanding events
 514          */
 515         bool lowPowerEntryReady() const;
 516
 517         /**
 518          * Let the rank check if it was waiting for requests to drain
 519          * to allow it to transition states.
 520          */
 521         void checkDrainDone();
 522
 523         /**
 524          * Push command out of cmdList queue that are scheduled at
 525          * or before curTick() to DRAMPower library
 526          * All commands before curTick are guaranteed to be complete
 527          * and can safely be flushed.
 528          */
 529         void flushCmdList();
 530
 531         /*
 532          * Function to register Stats
 533          */
 534         void regStats();
 535
 536         /**
 537          * Computes stats just prior to dump event
 538          */
 539         void computeStats();
 540
 541         /**
 542          * Schedule a transition to power-down (sleep)
 543          *
 544          * @param pwr_state Power state to transition to
 545          * @param tick Absolute tick when transition should take place
 546          */
 547         void powerDownSleep(PowerState pwr_state, Tick tick);
 548
 549        /**
 550          * schedule and event to wake-up from power-down or self-refresh
 551          * and update bank timing parameters
 552          *
 553          * @param exit_delay Relative tick defining the delay required between
 554          *                   low-power exit and the next command
 555          */
 556         void scheduleWakeUpEvent(Tick exit_delay);
 557
 558         void processWriteDoneEvent();
 559         EventFunctionWrapper writeDoneEvent;
 560
 561         void processActivateEvent();
 562         EventFunctionWrapper activateEvent;
 563
 564         void processPrechargeEvent();
 565         EventFunctionWrapper prechargeEvent;
 566
 567         void processRefreshEvent();
 568         EventFunctionWrapper refreshEvent;
 569
 570         void processPowerEvent();
 571         EventFunctionWrapper powerEvent;
 572
 573         void processWakeUpEvent();
 574         EventFunctionWrapper wakeUpEvent;
 575
 576     };
 577
 578     // define the process to compute stats on simulation exit
 579     // defined per rank as the per rank stats are based on state
 580     // transition and periodically updated, requiring re-sync at
 581     // exit.
 582     class RankDumpCallback : public Callback
 583     {
 584         Rank *ranks;
 585       public:
 586         RankDumpCallback(Rank *r) : ranks(r) {}
 587         virtual void process() { ranks->computeStats(); };
 588     };
 589
 590     /**
 591      * A burst helper helps organize and manage a packet that is larger than
 592      * the DRAM burst size. A system packet that is larger than the burst size
 593      * is split into multiple DRAM packets and all those DRAM packets point to
 594      * a single burst helper such that we know when the whole packet is served.
 595      */
 596     class BurstHelper {
 597
 598       public:
 599
 600         /** Number of DRAM bursts requred for a system packet **/
 601         const unsigned int burstCount;
 602
 603         /** Number of DRAM bursts serviced so far for a system packet **/
 604         unsigned int burstsServiced;
 605
 606         BurstHelper(unsigned int _burstCount)
 607             : burstCount(_burstCount), burstsServiced(0)
 608         { }
 609     };
 610
 611     /**
 612      * A DRAM packet stores packets along with the timestamp of when
 613      * the packet entered the queue, and also the decoded address.
 614      */
 615     class DRAMPacket {
 616
 617       public:
 618
 619         /** When did request enter the controller */
 620         const Tick entryTime;
 621
 622         /** When will request leave the controller */
 623         Tick readyTime;
 624
 625         /** This comes from the outside world */
 626         const PacketPtr pkt;
 627
 628         const bool isRead;
 629
 630         /** Will be populated by address decoder */
 631         const uint8_t rank;
 632         const uint8_t bank;
 633         const uint32_t row;
 634
 635         /**
 636          * Bank id is calculated considering banks in all the ranks
 637          * eg: 2 ranks each with 8 banks, then bankId = 0 --> rank0, bank0 and
 638          * bankId = 8 --> rank1, bank0
 639          */
 640         const uint16_t bankId;
 641
 642         /**
 643          * The starting address of the DRAM packet.
 644          * This address could be unaligned to burst size boundaries. The
 645          * reason is to keep the address offset so we can accurately check
 646          * incoming read packets with packets in the write queue.
 647          */
 648         Addr addr;
 649
 650         /**
 651          * The size of this dram packet in bytes
 652          * It is always equal or smaller than DRAM burst size
 653          */
 654         unsigned int size;
 655
 656         /**
 657          * A pointer to the BurstHelper if this DRAMPacket is a split packet
 658          * If not a split packet (common case), this is set to NULL
 659          */
 660         BurstHelper* burstHelper;
 661         Bank& bankRef;
 662         Rank& rankRef;
 663
 664         DRAMPacket(PacketPtr _pkt, bool is_read, uint8_t _rank, uint8_t _bank,
 665                    uint32_t _row, uint16_t bank_id, Addr _addr,
 666                    unsigned int _size, Bank& bank_ref, Rank& rank_ref)
 667             : entryTime(curTick()), readyTime(curTick()),
 668               pkt(_pkt), isRead(is_read), rank(_rank), bank(_bank), row(_row),
 669               bankId(bank_id), addr(_addr), size(_size), burstHelper(NULL),
 670               bankRef(bank_ref), rankRef(rank_ref)
 671         { }
 672
 673     };
 674
 675     /**
 676      * Bunch of things requires to setup "events" in gem5
 677      * When event "respondEvent" occurs for example, the method
 678      * processRespondEvent is called; no parameters are allowed
 679      * in these methods
 680      */
 681     void processNextReqEvent();
 682     EventFunctionWrapper nextReqEvent;
 683
 684     void processRespondEvent();
 685     EventFunctionWrapper respondEvent;
 686
 687     /**
 688      * Check if the read queue has room for more entries
 689      *
 690      * @param pktCount The number of entries needed in the read queue
 691      * @return true if read queue is full, false otherwise
 692      */
 693     bool readQueueFull(unsigned int pktCount) const;
 694
 695     /**
 696      * Check if the write queue has room for more entries
 697      *
 698      * @param pktCount The number of entries needed in the write queue
 699      * @return true if write queue is full, false otherwise
 700      */
 701     bool writeQueueFull(unsigned int pktCount) const;
 702
 703     /**
 704      * When a new read comes in, first check if the write q has a
 705      * pending request to the same address.\ If not, decode the
 706      * address to populate rank/bank/row, create one or mutliple
 707      * "dram_pkt", and push them to the back of the read queue.\
 708      * If this is the only
 709      * read request in the system, schedule an event to start
 710      * servicing it.
 711      *
 712      * @param pkt The request packet from the outside world
 713      * @param pktCount The number of DRAM bursts the pkt
 714      * translate to. If pkt size is larger then one full burst,
 715      * then pktCount is greater than one.
 716      */
 717     void addToReadQueue(PacketPtr pkt, unsigned int pktCount);
 718
 719     /**
 720      * Decode the incoming pkt, create a dram_pkt and push to the
 721      * back of the write queue. \If the write q length is more than
 722      * the threshold specified by the user, ie the queue is beginning
 723      * to get full, stop reads, and start draining writes.
 724      *
 725      * @param pkt The request packet from the outside world
 726      * @param pktCount The number of DRAM bursts the pkt
 727      * translate to. If pkt size is larger then one full burst,
 728      * then pktCount is greater than one.
 729      */
 730     void addToWriteQueue(PacketPtr pkt, unsigned int pktCount);
 731
 732     /**
 733      * Actually do the DRAM access - figure out the latency it
 734      * will take to service the req based on bank state, channel state etc
 735      * and then update those states to account for this request.\ Based
 736      * on this, update the packet's "readyTime" and move it to the
 737      * response q from where it will eventually go back to the outside
 738      * world.
 739      *
 740      * @param pkt The DRAM packet created from the outside world pkt
 741      */
 742     void doDRAMAccess(DRAMPacket* dram_pkt);
 743
 744     /**
 745      * When a packet reaches its "readyTime" in the response Q,
 746      * use the "access()" method in AbstractMemory to actually
 747      * create the response packet, and send it back to the outside
 748      * world requestor.
 749      *
 750      * @param pkt The packet from the outside world
 751      * @param static_latency Static latency to add before sending the packet
 752      */
 753     void accessAndRespond(PacketPtr pkt, Tick static_latency);
 754
 755     /**
 756      * Address decoder to figure out physical mapping onto ranks,
 757      * banks, and rows. This function is called multiple times on the same
 758      * system packet if the pakcet is larger than burst of the memory. The
 759      * dramPktAddr is used for the offset within the packet.
 760      *
 761      * @param pkt The packet from the outside world
 762      * @param dramPktAddr The starting address of the DRAM packet
 763      * @param size The size of the DRAM packet in bytes
 764      * @param isRead Is the request for a read or a write to DRAM
 765      * @return A DRAMPacket pointer with the decoded information
 766      */
 767     DRAMPacket* decodeAddr(PacketPtr pkt, Addr dramPktAddr, unsigned int size,
 768                            bool isRead);
 769
 770     /**
 771      * The memory schduler/arbiter - picks which request needs to
 772      * go next, based on the specified policy such as FCFS or FR-FCFS
 773      * and moves it to the head of the queue.
 774      * Prioritizes accesses to the same rank as previous burst unless
 775      * controller is switching command type.
 776      *
 777      * @param queue Queued requests to consider
 778      * @param extra_col_delay Any extra delay due to a read/write switch
 779      * @return true if a packet is scheduled to a rank which is available else
 780      * false
 781      */
 782     bool chooseNext(std::deque<DRAMPacket*>& queue, Tick extra_col_delay);
 783
 784     /**
 785      * For FR-FCFS policy reorder the read/write queue depending on row buffer
 786      * hits and earliest bursts available in DRAM
 787      *
 788      * @param queue Queued requests to consider
 789      * @param extra_col_delay Any extra delay due to a read/write switch
 790      * @return true if a packet is scheduled to a rank which is available else
 791      * false
 792      */
 793     bool reorderQueue(std::deque<DRAMPacket*>& queue, Tick extra_col_delay);
 794
 795     /**
 796      * Find which are the earliest banks ready to issue an activate
 797      * for the enqueued requests. Assumes maximum of 64 banks per DIMM
 798      * Also checks if the bank is already prepped.
 799      *
 800      * @param queue Queued requests to consider
 801      * @param time of seamless burst command
 802      * @return One-hot encoded mask of bank indices
 803      * @return boolean indicating burst can issue seamlessly, with no gaps
 804      */
 805     std::pair<uint64_t, bool> minBankPrep(const std::deque<DRAMPacket*>& queue,
 806                                           Tick min_col_at) const;
 807
 808     /**
 809      * Keep track of when row activations happen, in order to enforce
 810      * the maximum number of activations in the activation window. The
 811      * method updates the time that the banks become available based
 812      * on the current limits.
 813      *
 814      * @param rank_ref Reference to the rank
 815      * @param bank_ref Reference to the bank
 816      * @param act_tick Time when the activation takes place
 817      * @param row Index of the row
 818      */
 819     void activateBank(Rank& rank_ref, Bank& bank_ref, Tick act_tick,
 820                       uint32_t row);
 821
 822     /**
 823      * Precharge a given bank and also update when the precharge is
 824      * done. This will also deal with any stats related to the
 825      * accesses to the open page.
 826      *
 827      * @param rank_ref The rank to precharge
 828      * @param bank_ref The bank to precharge
 829      * @param pre_at Time when the precharge takes place
 830      * @param trace Is this an auto precharge then do not add to trace
 831      */
 832     void prechargeBank(Rank& rank_ref, Bank& bank_ref,
 833                        Tick pre_at, bool trace = true);
 834
 835     /**
 836      * Used for debugging to observe the contents of the queues.
 837      */
 838     void printQs() const;
 839
 840     /**
 841      * Burst-align an address.
 842      *
 843      * @param addr The potentially unaligned address
 844      *
 845      * @return An address aligned to a DRAM burst
 846      */
 847     Addr burstAlign(Addr addr) const { return (addr & ~(Addr(burstSize - 1))); }
 848
 849     /**
 850      * The controller's main read and write queues
 851      */
 852     std::deque<DRAMPacket*> readQueue;
 853     std::deque<DRAMPacket*> writeQueue;
 854
 855     /**
 856      * To avoid iterating over the write queue to check for
 857      * overlapping transactions, maintain a set of burst addresses
 858      * that are currently queued. Since we merge writes to the same
 859      * location we never have more than one address to the same burst
 860      * address.
 861      */
 862     std::unordered_set<Addr> isInWriteQueue;
 863
 864     /**
 865      * Response queue where read packets wait after we're done working
 866      * with them, but it's not time to send the response yet. The
 867      * responses are stored seperately mostly to keep the code clean
 868      * and help with events scheduling. For all logical purposes such
 869      * as sizing the read queue, this and the main read queue need to
 870      * be added together.
 871      */
 872     std::deque<DRAMPacket*> respQueue;
 873
 874     /**
 875      * Vector of ranks
 876      */
 877     std::vector<Rank*> ranks;
 878
 879     /**
 880      * The following are basic design parameters of the memory
 881      * controller, and are initialized based on parameter values.
 882      * The rowsPerBank is determined based on the capacity, number of
 883      * ranks and banks, the burst size, and the row buffer size.
 884      */
 885     const uint32_t deviceSize;
 886     const uint32_t deviceBusWidth;
 887     const uint32_t burstLength;
 888     const uint32_t deviceRowBufferSize;
 889     const uint32_t devicesPerRank;
 890     const uint32_t burstSize;
 891     const uint32_t rowBufferSize;
 892     const uint32_t columnsPerRowBuffer;
 893     const uint32_t columnsPerStripe;
 894     const uint32_t ranksPerChannel;
 895     const uint32_t bankGroupsPerRank;
 896     const bool bankGroupArch;
 897     const uint32_t banksPerRank;
 898     const uint32_t channels;
 899     uint32_t rowsPerBank;
 900     const uint32_t readBufferSize;
 901     const uint32_t writeBufferSize;
 902     const uint32_t writeHighThreshold;
 903     const uint32_t writeLowThreshold;
 904     const uint32_t minWritesPerSwitch;
 905     uint32_t writesThisTime;
 906     uint32_t readsThisTime;
 907
 908     /**
 909      * Basic memory timing parameters initialized based on parameter
 910      * values.
 911      */
 912     const Tick M5_CLASS_VAR_USED tCK;
 913     const Tick tWTR;
 914     const Tick tRTW;
 915     const Tick tCS;
 916     const Tick tBURST;
 917     const Tick tCCD_L;
 918     const Tick tRCD;
 919     const Tick tCL;
 920     const Tick tRP;
 921     const Tick tRAS;
 922     const Tick tWR;
 923     const Tick tRTP;
 924     const Tick tRFC;
 925     const Tick tREFI;
 926     const Tick tRRD;
 927     const Tick tRRD_L;
 928     const Tick tXAW;
 929     const Tick tXP;
 930     const Tick tXS;
 931     const uint32_t activationLimit;
 932
 933     /**
 934      * Memory controller configuration initialized based on parameter
 935      * values.
 936      */
 937     Enums::MemSched memSchedPolicy;
 938     Enums::AddrMap addrMapping;
 939     Enums::PageManage pageMgmt;
 940
 941     /**
 942      * Max column accesses (read and write) per row, before forefully
 943      * closing it.
 944      */
 945     const uint32_t maxAccessesPerRow;
 946
 947     /**
 948      * Pipeline latency of the controller frontend. The frontend
 949      * contribution is added to writes (that complete when they are in
 950      * the write buffer) and reads that are serviced the write buffer.
 951      */
 952     const Tick frontendLatency;
 953
 954     /**
 955      * Pipeline latency of the backend and PHY. Along with the
 956      * frontend contribution, this latency is added to reads serviced
 957      * by the DRAM.
 958      */
 959     const Tick backendLatency;
 960
 961     /**
 962      * Till when has the main data bus been spoken for already?
 963      */
 964     Tick busBusyUntil;
 965
 966     Tick prevArrival;
 967
 968     /**
 969      * The soonest you have to start thinking about the next request
 970      * is the longest access time that can occur before
 971      * busBusyUntil. Assuming you need to precharge, open a new row,
 972      * and access, it is tRP + tRCD + tCL.
 973      */
 974     Tick nextReqTime;
 975
 976     // All statistics that the model needs to capture
 977     Stats::Scalar readReqs;
 978     Stats::Scalar writeReqs;
 979     Stats::Scalar readBursts;
 980     Stats::Scalar writeBursts;
 981     Stats::Scalar bytesReadDRAM;
 982     Stats::Scalar bytesReadWrQ;
 983     Stats::Scalar bytesWritten;
 984     Stats::Scalar bytesReadSys;
 985     Stats::Scalar bytesWrittenSys;
 986     Stats::Scalar servicedByWrQ;
 987     Stats::Scalar mergedWrBursts;
 988     Stats::Scalar neitherReadNorWrite;
 989     Stats::Vector perBankRdBursts;
 990     Stats::Vector perBankWrBursts;
 991     Stats::Scalar numRdRetry;
 992     Stats::Scalar numWrRetry;
 993     Stats::Scalar totGap;
 994     Stats::Vector readPktSize;
 995     Stats::Vector writePktSize;
 996     Stats::Vector rdQLenPdf;
 997     Stats::Vector wrQLenPdf;
 998     Stats::Histogram bytesPerActivate;
 999     Stats::Histogram rdPerTurnAround;
1000     Stats::Histogram wrPerTurnAround;
1001
1002     // Latencies summed over all requests
1003     Stats::Scalar totQLat;
1004     Stats::Scalar totMemAccLat;
1005     Stats::Scalar totBusLat;
1006
1007     // Average latencies per request
1008     Stats::Formula avgQLat;
1009     Stats::Formula avgBusLat;
1010     Stats::Formula avgMemAccLat;
1011
1012     // Average bandwidth
1013     Stats::Formula avgRdBW;
1014     Stats::Formula avgWrBW;
1015     Stats::Formula avgRdBWSys;
1016     Stats::Formula avgWrBWSys;
1017     Stats::Formula peakBW;
1018     Stats::Formula busUtil;
1019     Stats::Formula busUtilRead;
1020     Stats::Formula busUtilWrite;
1021
1022     // Average queue lengths
1023     Stats::Average avgRdQLen;
1024     Stats::Average avgWrQLen;
1025
1026     // Row hit count and rate
1027     Stats::Scalar readRowHits;
1028     Stats::Scalar writeRowHits;
1029     Stats::Formula readRowHitRate;
1030     Stats::Formula writeRowHitRate;
1031     Stats::Formula avgGap;
1032
1033     // DRAM Power Calculation
1034     Stats::Formula pageHitRate;
1035
1036     // Holds the value of the rank of burst issued
1037     uint8_t activeRank;
1038
1039     // timestamp offset
1040     uint64_t timeStampOffset;
1041
1042     /**
1043      * Upstream caches need this packet until true is returned, so
1044      * hold it for deletion until a subsequent call
1045      */
1046     std::unique_ptr<Packet> pendingDelete;
1047
1048     /**
1049      * This function increments the energy when called. If stats are
1050      * dumped periodically, note accumulated energy values will
1051      * appear in the stats (even if the stats are reset). This is a
1052      * result of the energy values coming from DRAMPower, and there
1053      * is currently no support for resetting the state.
1054      *
1055      * @param rank Currrent rank
1056      */
1057     void updatePowerStats(Rank& rank_ref);
1058
1059     /**
1060      * Function for sorting Command structures based on timeStamp
1061      *
1062      * @param a Memory Command
1063      * @param next Memory Command
1064      * @return true if timeStamp of Command 1 < timeStamp of Command 2
1065      */
1066     static bool sortTime(const Command& cmd, const Command& cmd_next) {
1067         return cmd.timeStamp < cmd_next.timeStamp;
1068     };
1069
1070   public:
1071
1072     void regStats() override;
1073
1074     DRAMCtrl(const DRAMCtrlParams* p);
1075
1076     DrainState drain() override;
1077
1078     virtual BaseSlavePort& getSlavePort(const std::string& if_name,
1079                                         PortID idx = InvalidPortID) override;
1080
1081     virtual void init() override;
1082     virtual void startup() override;
1083     virtual void drainResume() override;
1084
1085     /**
1086      * Return true once refresh is complete for all ranks and there are no
1087      * additional commands enqueued.  (only evaluated when draining)
1088      * This will ensure that all banks are closed, power state is IDLE, and
1089      * power stats have been updated
1090      *
1091      * @return true if all ranks have refreshed, with no commands enqueued
1092      *
1093      */
1094     bool allRanksDrained() const;
1095
1096   protected:
1097
1098     Tick recvAtomic(PacketPtr pkt);
1099     void recvFunctional(PacketPtr pkt);
1100     bool recvTimingReq(PacketPtr pkt);
1101
1102 };
1103
1104 #endif //__MEM_DRAM_CTRL_HH__