/*
 * Copyright (c) 2011-2013, 2017 ARM Limited
 * All rights reserved
 *
 * The license below extends only to copyright in the software and shall
 * not be construed as granting a license to any other intellectual
 * property including but not limited to intellectual property relating
 * to a hardware implementation of the functionality of the software
 * licensed hereunder. You may use the software subject to the license
 * terms below provided that you ensure that this notice is replicated
 * unmodified and in its entirety in all distributions of the software,
 * modified or unmodified, in source code or in binary form.
 *
 * Copyright (c) 2002-2005 The Regents of The University of Michigan
 * Copyright (c) 2011 Regents of the University of California
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * Authors: Steve Reinhardt
 *          Nathan Binkert
 *          Rick Strong
 */

#ifndef __CPU_BASE_HH__
#define __CPU_BASE_HH__

#include <limits>
#include <vector>

// Before we do anything else, check if this build is the NULL ISA,
// and if so stop here
#include "config/the_isa.hh"
#if THE_ISA == NULL_ISA
#include "arch/null/cpu_dummy.hh"
#else
#include "arch/interrupts.hh"
#include "arch/isa_traits.hh"
#include "arch/microcode_rom.hh"
#include "base/statistics.hh"
#include "mem/mem_object.hh"
#include "sim/eventq.hh"
#include "sim/full_system.hh"
#include "sim/insttracer.hh"
#include "sim/probe/pmu.hh"
#include "sim/probe/probe.hh"
#include "sim/system.hh"
#include "debug/Mwait.hh"

class BaseCPU;
struct BaseCPUParams;
class CheckerCPU;
class ThreadContext;

struct AddressMonitor
{
    AddressMonitor();
    bool doMonitor(PacketPtr pkt);

    bool armed;
    Addr vAddr;
    Addr pAddr;
    uint64_t val;
    bool waiting;   // 0=normal, 1=mwaiting
    bool gotWakeup;
};

class CPUProgressEvent : public Event
{
  protected:
    Tick _interval;
    Counter lastNumInst;
    BaseCPU *cpu;
    bool _repeatEvent;

  public:
    CPUProgressEvent(BaseCPU *_cpu, Tick ival = 0);

    void process();

    void interval(Tick ival) { _interval = ival; }
    Tick interval() { return _interval; }

    void repeatEvent(bool repeat) { _repeatEvent = repeat; }

    virtual const char *description() const;
};

class BaseCPU : public MemObject
{
  protected:

    /// Instruction count used for SPARC misc register
    /// @todo unify this with the counters that cpus individually keep
    Tick instCnt;

    // Every CPU has an ID; it is set at initialization, and the only time
    // it might change is during a takeover (which should be done from
    // within the BaseCPU anyway), so no setCpuId() method is provided.
    int _cpuId;

    /** Each cpu will have a socket ID that corresponds to its physical location
     * in the system. This is usually used to bucket cpu cores under a single
     * DVFS domain. This information may also be required by the OS to identify
     * the cpu core grouping (as in the case of ARM, via the MPIDR register).
     */
    const uint32_t _socketId;

    /** instruction side request id that must be placed in all requests */
    MasterID _instMasterId;

    /** data side request id that must be placed in all requests */
    MasterID _dataMasterId;

    /** An internal representation of a task identifier within gem5. This is
     * used so the CPU can add the taskId (an internal representation of the
     * OS process ID) to each request, so components in the memory system
     * can track which process IDs are ultimately interacting with them.
     */
    uint32_t _taskId;

    /** The current OS process ID that is executing on this processor. This is
     * used to generate the taskId. */
    uint32_t _pid;

    /** Is the CPU switched out or active? */
    bool _switchedOut;

    /** Cached copy of the cache line size obtained from the system */
    const unsigned int _cacheLineSize;

  public:

    /**
     * Pure virtual method that returns a reference to the data
     * port. All subclasses must implement this method.
     *
     * @return a reference to the data port
     */
    virtual MasterPort &getDataPort() = 0;

    /**
     * Pure virtual method that returns a reference to the instruction
     * port. All subclasses must implement this method.
     *
     * @return a reference to the instruction port
     */
    virtual MasterPort &getInstPort() = 0;

    /** Reads this CPU's ID. */
    int cpuId() const { return _cpuId; }

    /** Reads this CPU's Socket ID. */
    uint32_t socketId() const { return _socketId; }

    /** Reads this CPU's unique data requestor ID */
    MasterID dataMasterId() { return _dataMasterId; }
    /** Reads this CPU's unique instruction requestor ID */
    MasterID instMasterId() { return _instMasterId; }

    /**
     * Get a master port on this CPU. All CPUs have a data and
     * instruction port, and this method uses getDataPort and
     * getInstPort of the subclasses to resolve the two ports.
     *
     * @param if_name the port name
     * @param idx ignored index
     *
     * @return a reference to the port with the given name
     */
    BaseMasterPort &getMasterPort(const std::string &if_name,
                                  PortID idx = InvalidPortID) override;

    /** Get cpu task id */
    uint32_t taskId() const { return _taskId; }
    /** Set cpu task id */
    void taskId(uint32_t id) { _taskId = id; }

    uint32_t getPid() const { return _pid; }
    void setPid(uint32_t pid) { _pid = pid; }

    inline void workItemBegin() { numWorkItemsStarted++; }
    inline void workItemEnd() { numWorkItemsCompleted++; }
    // @todo remove me after debugging with legion done
    Tick instCount() { return instCnt; }

    TheISA::MicrocodeRom microcodeRom;

  protected:
    std::vector<TheISA::Interrupts*> interrupts;

  public:
    TheISA::Interrupts *
    getInterruptController(ThreadID tid)
    {
        if (interrupts.empty())
            return NULL;

        assert(interrupts.size() > tid);
        return interrupts[tid];
    }

    virtual void wakeup(ThreadID tid) = 0;

    void
    postInterrupt(ThreadID tid, int int_num, int index)
    {
        interrupts[tid]->post(int_num, index);
        if (FullSystem)
            wakeup(tid);
    }

    void
    clearInterrupt(ThreadID tid, int int_num, int index)
    {
        interrupts[tid]->clear(int_num, index);
    }

    void
    clearInterrupts(ThreadID tid)
    {
        interrupts[tid]->clearAll();
    }

    bool
    checkInterrupts(ThreadContext *tc) const
    {
        return FullSystem && interrupts[tc->threadId()]->checkInterrupts(tc);
    }

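    // Illustrative sketch only (not taken from the gem5 sources): a platform
    // or interrupt-controller model holding a BaseCPU pointer would drive the
    // helpers above roughly like this; `cpu`, `tc`, `tid`, `int_num` and
    // `index` are assumed names for the example.
    //
    //     cpu->postInterrupt(tid, int_num, index);   // raise the line (wakes
    //                                                // the CPU in full-system)
    //     if (cpu->checkInterrupts(tc))              // poll from the CPU side
    //         ; // fetch and service the interrupt
    //     cpu->clearInterrupt(tid, int_num, index);  // lower the line again
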
    void processProfileEvent();
    EventFunctionWrapper * profileEvent;

  protected:
    std::vector<ThreadContext *> threadContexts;

    Trace::InstTracer * tracer;

  public:


    /** Invalid or unknown Pid. Possible when operating system is not present
     *  or has not assigned a pid yet */
    static const uint32_t invldPid = std::numeric_limits<uint32_t>::max();

    // Mask to align PCs to MachInst sized boundaries
    static const Addr PCMask = ~((Addr)sizeof(TheISA::MachInst) - 1);

    /// Provide access to the tracer pointer
    Trace::InstTracer * getTracer() { return tracer; }

    /// Notify the CPU that the indicated context is now active.
    virtual void activateContext(ThreadID thread_num);

    /// Notify the CPU that the indicated context is now suspended.
    /// Check if it is possible to enter a lower power state.
    virtual void suspendContext(ThreadID thread_num);

    /// Notify the CPU that the indicated context is now halted.
    virtual void haltContext(ThreadID thread_num);

    /// Given a Thread Context pointer return the thread num
    int findContext(ThreadContext *tc);

    /// Given a thread num get the thread context for it
    virtual ThreadContext *getContext(int tn) { return threadContexts[tn]; }

    /// Get the number of thread contexts available
    unsigned numContexts() { return threadContexts.size(); }

    /// Convert ContextID to threadID
    ThreadID contextToThread(ContextID cid)
    { return static_cast<ThreadID>(cid - threadContexts[0]->contextId()); }

  public:
    typedef BaseCPUParams Params;
    const Params *params() const
    { return reinterpret_cast<const Params *>(_params); }
    BaseCPU(Params *params, bool is_checker = false);
    virtual ~BaseCPU();

    void init() override;
    void startup() override;
    void regStats() override;

    void regProbePoints() override;

    void registerThreadContexts();

    // Functions to deschedule and reschedule the events to enter the
    // power gating sleep before and after checkpointing respectively.
    void deschedulePowerGatingEvent();
    void schedulePowerGatingEvent();

    /**
     * Prepare for another CPU to take over execution.
     *
     * When this method exits, all internal state should have been
     * flushed. After the method returns, the simulator calls
     * takeOverFrom() on the new CPU with this CPU as its parameter.
     */
    virtual void switchOut();

    /**
     * Load the state of a CPU from the previous CPU object, invoked
     * on all new CPUs that are about to be switched in.
     *
     * A CPU model implementing this method is expected to initialize
     * its state from the old CPU and connect its memory (unless they
     * are already connected) to the memories connected to the old
     * CPU.
     *
     * @param cpu CPU to read state from.
     */
    virtual void takeOverFrom(BaseCPU *cpu);

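    // A rough sketch of the switch-over sequence implied by the two methods
    // above; the actual calls are issued by the switch-over machinery rather
    // than by user code, and `oldCPU`/`newCPU` are assumed names for the
    // example.
    //
    //     oldCPU->switchOut();           // drain and flush internal state
    //     newCPU->takeOverFrom(oldCPU);  // copy thread state, reconnect memory
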
    /**
     * Flush all TLBs in the CPU.
     *
     * This method is mainly used to flush stale translations when
     * switching CPUs. It is also exported to the Python world to
     * allow it to request a TLB flush after draining the CPU to make
     * it easier to compare traces when debugging
     * handover/checkpointing.
     */
    void flushTLBs();

    /**
     * Determine if the CPU is switched out.
     *
     * @return True if the CPU is switched out, false otherwise.
     */
    bool switchedOut() const { return _switchedOut; }

    /**
     * Verify that the system is in a memory mode supported by the
     * CPU.
     *
     * Implementations are expected to query the system for the
     * current memory mode and ensure that it is what the CPU model
     * expects. If the check fails, the implementation should
     * terminate the simulation using fatal().
     */
    virtual void verifyMemoryMode() const { };

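    // A minimal sketch of an override, assuming a hypothetical DerivedCPU
    // that only supports timing-mode memory (not the implementation of any
    // particular gem5 CPU model):
    //
    //     void
    //     DerivedCPU::verifyMemoryMode() const
    //     {
    //         if (!system->isTimingMode())
    //             fatal("This CPU requires the 'timing' memory mode.\n");
    //     }
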
    /**
     * Number of threads we're actually simulating (<= SMT_MAX_THREADS).
     * This is a constant for the duration of the simulation.
     */
    ThreadID numThreads;

    /**
     * Vector of per-thread instruction-based event queues. Used for
     * scheduling events based on number of instructions committed by
     * a particular thread.
     */
    EventQueue **comInstEventQueue;

    /**
     * Vector of per-thread load-based event queues. Used for
     * scheduling events based on number of loads committed by
     * a particular thread.
     */
    EventQueue **comLoadEventQueue;

    System *system;

    /**
     * Get the cache line size of the system.
     */
    inline unsigned int cacheLineSize() const { return _cacheLineSize; }

    /**
     * Serialize this object to the given output stream.
     *
     * @note CPU models should normally override the serializeThread()
     * method instead of the serialize() method as this provides a
     * uniform data format for all CPU models and promotes better code
     * reuse.
     *
     * @param cp The stream to serialize to.
     */
    void serialize(CheckpointOut &cp) const override;

    /**
     * Reconstruct the state of this object from a checkpoint.
     *
     * @note CPU models should normally override the
     * unserializeThread() method instead of the unserialize() method
     * as this provides a uniform data format for all CPU models and
     * promotes better code reuse.
     *
     * @param cp The checkpoint to use.
     */
    void unserialize(CheckpointIn &cp) override;

    /**
     * Serialize a single thread.
     *
     * @param cp The stream to serialize to.
     * @param tid ID of the current thread.
     */
    virtual void serializeThread(CheckpointOut &cp, ThreadID tid) const {};

    /**
     * Unserialize one thread.
     *
     * @param cp The checkpoint to use.
     * @param tid ID of the current thread.
     */
    virtual void unserializeThread(CheckpointIn &cp, ThreadID tid) {};

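    // A minimal sketch of a per-thread override, assuming a hypothetical
    // DerivedCPU whose per-thread state objects know how to serialize
    // themselves; real CPU models checkpoint considerably more state:
    //
    //     void
    //     DerivedCPU::serializeThread(CheckpointOut &cp, ThreadID tid) const
    //     {
    //         thread[tid]->serialize(cp);
    //     }
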
    virtual Counter totalInsts() const = 0;

    virtual Counter totalOps() const = 0;

    /**
     * Schedule an event that exits the simulation loops after a
     * predefined number of instructions.
     *
     * This method is usually called from the configuration script to
     * get an exit event some time in the future. It is typically used
     * when the script wants to simulate for a specific number of
     * instructions rather than ticks.
     *
     * @param tid Thread to monitor.
     * @param insts Number of instructions into the future.
     * @param cause Cause to signal in the exit event.
     */
    void scheduleInstStop(ThreadID tid, Counter insts, const char *cause);

    /**
     * Schedule an event that exits the simulation loops after a
     * predefined number of load operations.
     *
     * This method is usually called from the configuration script to
     * get an exit event some time in the future. It is typically used
     * when the script wants to simulate for a specific number of
     * loads rather than ticks.
     *
     * @param tid Thread to monitor.
     * @param loads Number of load instructions into the future.
     * @param cause Cause to signal in the exit event.
     */
    void scheduleLoadStop(ThreadID tid, Counter loads, const char *cause);

    /**
     * Get the number of instructions executed by the specified thread
     * on this CPU. Used by Python to control simulation.
     *
     * @param tid Thread to monitor
     * @return Number of instructions executed
     */
    uint64_t getCurrentInstCount(ThreadID tid);

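    // Illustrative use of the instruction-count exit event (the literal
    // values and the `cpu` name are examples only); the equivalent request
    // normally comes from the configuration script through this interface:
    //
    //     // Leave the simulation loop once thread 0 has committed another
    //     // one million instructions.
    //     cpu->scheduleInstStop(0, 1000000, "instruction limit reached");
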
  public:
    /**
     * @{
     * @name PMU Probe points.
     */

    /**
     * Helper method to trigger PMU probes for a committed
     * instruction.
     *
     * @param inst Instruction that just committed
     */
    virtual void probeInstCommit(const StaticInstPtr &inst);

  protected:
    /**
     * Helper method to instantiate probe points belonging to this
     * object.
     *
     * @param name Name of the probe point.
     * @return A unique_ptr to the new probe point.
     */
    ProbePoints::PMUUPtr pmuProbePoint(const char *name);

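    // Sketch of how a CPU model typically creates its PMU probe points from
    // regProbePoints(); the probe point names here are illustrative:
    //
    //     ppRetiredInsts = pmuProbePoint("RetiredInsts");
    //     ppRetiredLoads = pmuProbePoint("RetiredLoads");
    //     ppRetiredStores = pmuProbePoint("RetiredStores");
    //     ppRetiredBranches = pmuProbePoint("RetiredBranches");
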
    /**
     * Instruction commit probe point.
     *
     * This probe point is triggered whenever one or more instructions
     * are committed. It is normally triggered once for every
     * instruction. However, CPU models committing bundles of
     * instructions may call notify once for the entire bundle.
     */
    ProbePoints::PMUUPtr ppRetiredInsts;

    /** Retired load instructions */
    ProbePoints::PMUUPtr ppRetiredLoads;
    /** Retired store instructions */
    ProbePoints::PMUUPtr ppRetiredStores;

    /** Retired branches (any type) */
    ProbePoints::PMUUPtr ppRetiredBranches;

    /** CPU cycle counter; counts even if all thread contexts are suspended */
    ProbePoints::PMUUPtr ppAllCycles;

    /** CPU cycle counter; only counts if any thread context is active */
    ProbePoints::PMUUPtr ppActiveCycles;

    /**
     * ProbePoint that signals transitions in the set of active
     * threadContexts of this CPU. The ProbePoint reports information
     * through its bool parameter.
     * - If the parameter is true then the last enabled threadContext of the
     *   CPU object was disabled.
     * - If the parameter is false then a threadContext was enabled while all
     *   the remaining threadContexts were disabled.
     */
    ProbePointArg<bool> *ppSleeping;
    /** @} */

    enum CPUState {
        CPU_STATE_ON,
        CPU_STATE_SLEEP,
        CPU_STATE_WAKEUP
    };

    Cycles previousCycle;
    CPUState previousState;

    /** base method keeping track of cycle progression **/
    inline void updateCycleCounters(CPUState state)
    {
        uint32_t delta = curCycle() - previousCycle;

        if (previousState == CPU_STATE_ON) {
            ppActiveCycles->notify(delta);
        }

        switch (state)
        {
          case CPU_STATE_WAKEUP:
            ppSleeping->notify(false);
            break;
          case CPU_STATE_SLEEP:
            ppSleeping->notify(true);
            break;
          default:
            break;
        }

        ppAllCycles->notify(delta);

        previousCycle = curCycle();
        previousState = state;
    }

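    // Expected calling convention, inferred from the logic above (a sketch,
    // not a requirement imposed on any particular CPU model): call this each
    // time the model advances, passing the state being entered.
    //
    //     updateCycleCounters(CPU_STATE_ON);      // ordinary active cycle(s)
    //     updateCycleCounters(CPU_STATE_SLEEP);   // about to suspend
    //     updateCycleCounters(CPU_STATE_WAKEUP);  // first cycle after waking
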
    // Function tracing
  private:
    bool functionTracingEnabled;
    std::ostream *functionTraceStream;
    Addr currentFunctionStart;
    Addr currentFunctionEnd;
    Tick functionEntryTick;
    void enableFunctionTrace();
    void traceFunctionsInternal(Addr pc);

  private:
    static std::vector<BaseCPU *> cpuList;   //!< Static global cpu list

  public:
    void traceFunctions(Addr pc)
    {
        if (functionTracingEnabled)
            traceFunctionsInternal(pc);
    }

    static int numSimulatedCPUs() { return cpuList.size(); }
    static Counter numSimulatedInsts()
    {
        Counter total = 0;

        int size = cpuList.size();
        for (int i = 0; i < size; ++i)
            total += cpuList[i]->totalInsts();

        return total;
    }

    static Counter numSimulatedOps()
    {
        Counter total = 0;

        int size = cpuList.size();
        for (int i = 0; i < size; ++i)
            total += cpuList[i]->totalOps();

        return total;
    }

  public:
    // Number of CPU cycles simulated
    Stats::Scalar numCycles;
    Stats::Scalar numWorkItemsStarted;
    Stats::Scalar numWorkItemsCompleted;

  private:
    std::vector<AddressMonitor> addressMonitor;

  public:
    void armMonitor(ThreadID tid, Addr address);
    bool mwait(ThreadID tid, PacketPtr pkt);
    void mwaitAtomic(ThreadID tid, ThreadContext *tc, BaseTLB *dtb);
    AddressMonitor *getCpuAddrMonitor(ThreadID tid)
    {
        assert(tid < numThreads);
        return &addressMonitor[tid];
    }

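    // Hedged sketch of the monitor/mwait flow suggested by the interface
    // above (the call sites and names are assumptions, not gem5 code):
    //
    //     armMonitor(tid, addr);    // record the address the thread waits on
    //     mwait(tid, pkt);          // then wait for a matching write
    //
    // Incoming writes are checked against the armed monitor with
    // AddressMonitor::doMonitor(pkt), which reports whether the access
    // should wake the waiting thread.
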
    bool waitForRemoteGDB() const;

    Cycles syscallRetryLatency;

    // Enables CPU to enter power gating on a configurable cycle count
  protected:
    void enterPwrGating();

    const Cycles pwrGatingLatency;
    const bool powerGatingOnIdle;
    EventFunctionWrapper enterPwrGatingEvent;
};

#endif // THE_ISA == NULL_ISA

#endif // __CPU_BASE_HH__