src/cpu/base.hh

   1 /*
   2  * Copyright (c) 2011-2013 ARM Limited
   3  * All rights reserved
   4  *
   5  * The license below extends only to copyright in the software and shall
   6  * not be construed as granting a license to any other intellectual
   7  * property including but not limited to intellectual property relating
   8  * to a hardware implementation of the functionality of the software
   9  * licensed hereunder.  You may use the software subject to the license
  10  * terms below provided that you ensure that this notice is replicated
  11  * unmodified and in its entirety in all distributions of the software,
  12  * modified or unmodified, in source code or in binary form.
  13  *
  14  * Copyright (c) 2002-2005 The Regents of The University of Michigan
  15  * Copyright (c) 2011 Regents of the University of California
  16  * All rights reserved.
  17  *
  18  * Redistribution and use in source and binary forms, with or without
  19  * modification, are permitted provided that the following conditions are
  20  * met: redistributions of source code must retain the above copyright
  21  * notice, this list of conditions and the following disclaimer;
  22  * redistributions in binary form must reproduce the above copyright
  23  * notice, this list of conditions and the following disclaimer in the
  24  * documentation and/or other materials provided with the distribution;
  25  * neither the name of the copyright holders nor the names of its
  26  * contributors may be used to endorse or promote products derived from
  27  * this software without specific prior written permission.
  28  *
  29  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  30  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  31  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  32  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  33  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  34  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  35  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  36  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  37  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  38  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  39  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  40  *
  41  * Authors: Steve Reinhardt
  42  *          Nathan Binkert
  43  *          Rick Strong
  44  */
  45
  46 #ifndef __CPU_BASE_HH__
  47 #define __CPU_BASE_HH__
  48
  49 #include <vector>
  50
  51 // Before we do anything else, check if this build is the NULL ISA,
  52 // and if so stop here
  53 #include "config/the_isa.hh"
  54 #if THE_ISA == NULL_ISA
  55 #include "arch/null/cpu_dummy.hh"
  56 #else
  57 #include "arch/interrupts.hh"
  58 #include "arch/isa_traits.hh"
  59 #include "arch/microcode_rom.hh"
  60 #include "base/statistics.hh"
  61 #include "mem/mem_object.hh"
  62 #include "sim/eventq.hh"
  63 #include "sim/full_system.hh"
  64 #include "sim/insttracer.hh"
  65 #include "sim/probe/pmu.hh"
  66 #include "sim/system.hh"
  67 #include "debug/Mwait.hh"
  68
  69 class BaseCPU;
  70 struct BaseCPUParams;
  71 class CheckerCPU;
  72 class ThreadContext;
  73
  74 struct AddressMonitor
  75 {
  76     AddressMonitor();
  77     bool doMonitor(PacketPtr pkt);
  78
  79     bool armed;
  80     Addr vAddr;
  81     Addr pAddr;
  82     uint64_t val;
  83     bool waiting;   // 0=normal, 1=mwaiting
  84     bool gotWakeup;
  85 };
  86
  87 class CPUProgressEvent : public Event
  88 {
  89   protected:
  90     Tick _interval;
  91     Counter lastNumInst;
  92     BaseCPU *cpu;
  93     bool _repeatEvent;
  94
  95   public:
  96     CPUProgressEvent(BaseCPU *_cpu, Tick ival = 0);
  97
  98     void process();
  99
 100     void interval(Tick ival) { _interval = ival; }
 101     Tick interval() { return _interval; }
 102
 103     void repeatEvent(bool repeat) { _repeatEvent = repeat; }
 104
 105     virtual const char *description() const;
 106 };
 107
 108 class BaseCPU : public MemObject
 109 {
 110   protected:
 111
 112     /// Instruction count used for SPARC misc register
 113     /// @todo unify this with the counters that cpus individually keep
 114     Tick instCnt;
 115
 116     // every cpu has an id, put it in the base cpu
 117     // Set at initialization, only time a cpuId might change is during a
 118     // takeover (which should be done from within the BaseCPU anyway,
 119     // therefore no setCpuId() method is provided
 120     int _cpuId;
 121
 122     /** Each cpu will have a socket ID that corresponds to its physical location
 123      * in the system. This is usually used to bucket cpu cores under single DVFS
 124      * domain. This information may also be required by the OS to identify the
 125      * cpu core grouping (as in the case of ARM via MPIDR register)
 126      */
 127     const uint32_t _socketId;
 128
 129     /** instruction side request id that must be placed in all requests */
 130     MasterID _instMasterId;
 131
 132     /** data side request id that must be placed in all requests */
 133     MasterID _dataMasterId;
 134
 135     /** An intrenal representation of a task identifier within gem5. This is
 136      * used so the CPU can add which taskId (which is an internal representation
 137      * of the OS process ID) to each request so components in the memory system
 138      * can track which process IDs are ultimately interacting with them
 139      */
 140     uint32_t _taskId;
 141
 142     /** The current OS process ID that is executing on this processor. This is
 143      * used to generate a taskId */
 144     uint32_t _pid;
 145
 146     /** Is the CPU switched out or active? */
 147     bool _switchedOut;
 148
 149     /** Cache the cache line size that we get from the system */
 150     const unsigned int _cacheLineSize;
 151
 152   public:
 153
 154     /**
 155      * Purely virtual method that returns a reference to the data
 156      * port. All subclasses must implement this method.
 157      *
 158      * @return a reference to the data port
 159      */
 160     virtual MasterPort &getDataPort() = 0;
 161
 162     /**
 163      * Purely virtual method that returns a reference to the instruction
 164      * port. All subclasses must implement this method.
 165      *
 166      * @return a reference to the instruction port
 167      */
 168     virtual MasterPort &getInstPort() = 0;
 169
 170     /** Reads this CPU's ID. */
 171     int cpuId() const { return _cpuId; }
 172
 173     /** Reads this CPU's Socket ID. */
 174     uint32_t socketId() const { return _socketId; }
 175
 176     /** Reads this CPU's unique data requestor ID */
 177     MasterID dataMasterId() { return _dataMasterId; }
 178     /** Reads this CPU's unique instruction requestor ID */
 179     MasterID instMasterId() { return _instMasterId; }
 180
 181     /**
 182      * Get a master port on this CPU. All CPUs have a data and
 183      * instruction port, and this method uses getDataPort and
 184      * getInstPort of the subclasses to resolve the two ports.
 185      *
 186      * @param if_name the port name
 187      * @param idx ignored index
 188      *
 189      * @return a reference to the port with the given name
 190      */
 191     BaseMasterPort &getMasterPort(const std::string &if_name,
 192                                   PortID idx = InvalidPortID);
 193
 194     /** Get cpu task id */
 195     uint32_t taskId() const { return _taskId; }
 196     /** Set cpu task id */
 197     void taskId(uint32_t id) { _taskId = id; }
 198
 199     uint32_t getPid() const { return _pid; }
 200     void setPid(uint32_t pid) { _pid = pid; }
 201
 202     inline void workItemBegin() { numWorkItemsStarted++; }
 203     inline void workItemEnd() { numWorkItemsCompleted++; }
 204     // @todo remove me after debugging with legion done
 205     Tick instCount() { return instCnt; }
 206
 207     TheISA::MicrocodeRom microcodeRom;
 208
 209   protected:
 210     TheISA::Interrupts *interrupts;
 211
 212   public:
 213     TheISA::Interrupts *
 214     getInterruptController()
 215     {
 216         return interrupts;
 217     }
 218
 219     virtual void wakeup() = 0;
 220
 221     void
 222     postInterrupt(int int_num, int index)
 223     {
 224         interrupts->post(int_num, index);
 225         if (FullSystem)
 226             wakeup();
 227     }
 228
 229     void
 230     clearInterrupt(int int_num, int index)
 231     {
 232         interrupts->clear(int_num, index);
 233     }
 234
 235     void
 236     clearInterrupts()
 237     {
 238         interrupts->clearAll();
 239     }
 240
 241     bool
 242     checkInterrupts(ThreadContext *tc) const
 243     {
 244         return FullSystem && interrupts->checkInterrupts(tc);
 245     }
 246
 247     class ProfileEvent : public Event
 248     {
 249       private:
 250         BaseCPU *cpu;
 251         Tick interval;
 252
 253       public:
 254         ProfileEvent(BaseCPU *cpu, Tick interval);
 255         void process();
 256     };
 257     ProfileEvent *profileEvent;
 258
 259   protected:
 260     std::vector<ThreadContext *> threadContexts;
 261
 262     Trace::InstTracer * tracer;
 263
 264   public:
 265
 266     // Mask to align PCs to MachInst sized boundaries
 267     static const Addr PCMask = ~((Addr)sizeof(TheISA::MachInst) - 1);
 268
 269     /// Provide access to the tracer pointer
 270     Trace::InstTracer * getTracer() { return tracer; }
 271
 272     /// Notify the CPU that the indicated context is now active.
 273     virtual void activateContext(ThreadID thread_num) {}
 274
 275     /// Notify the CPU that the indicated context is now suspended.
 276     virtual void suspendContext(ThreadID thread_num) {}
 277
 278     /// Notify the CPU that the indicated context is now halted.
 279     virtual void haltContext(ThreadID thread_num) {}
 280
 281    /// Given a Thread Context pointer return the thread num
 282    int findContext(ThreadContext *tc);
 283
 284    /// Given a thread num get tho thread context for it
 285    virtual ThreadContext *getContext(int tn) { return threadContexts[tn]; }
 286
 287    /// Get the number of thread contexts available
 288    unsigned numContexts() { return threadContexts.size(); }
 289
 290   public:
 291     typedef BaseCPUParams Params;
 292     const Params *params() const
 293     { return reinterpret_cast<const Params *>(_params); }
 294     BaseCPU(Params *params, bool is_checker = false);
 295     virtual ~BaseCPU();
 296
 297     virtual void init();
 298     virtual void startup();
 299     virtual void regStats();
 300
 301     void regProbePoints() M5_ATTR_OVERRIDE;
 302
 303     void registerThreadContexts();
 304
 305     /**
 306      * Prepare for another CPU to take over execution.
 307      *
 308      * When this method exits, all internal state should have been
 309      * flushed. After the method returns, the simulator calls
 310      * takeOverFrom() on the new CPU with this CPU as its parameter.
 311      */
 312     virtual void switchOut();
 313
 314     /**
 315      * Load the state of a CPU from the previous CPU object, invoked
 316      * on all new CPUs that are about to be switched in.
 317      *
 318      * A CPU model implementing this method is expected to initialize
 319      * its state from the old CPU and connect its memory (unless they
 320      * are already connected) to the memories connected to the old
 321      * CPU.
 322      *
 323      * @param cpu CPU to initialize read state from.
 324      */
 325     virtual void takeOverFrom(BaseCPU *cpu);
 326
 327     /**
 328      * Flush all TLBs in the CPU.
 329      *
 330      * This method is mainly used to flush stale translations when
 331      * switching CPUs. It is also exported to the Python world to
 332      * allow it to request a TLB flush after draining the CPU to make
 333      * it easier to compare traces when debugging
 334      * handover/checkpointing.
 335      */
 336     void flushTLBs();
 337
 338     /**
 339      * Determine if the CPU is switched out.
 340      *
 341      * @return True if the CPU is switched out, false otherwise.
 342      */
 343     bool switchedOut() const { return _switchedOut; }
 344
 345     /**
 346      * Verify that the system is in a memory mode supported by the
 347      * CPU.
 348      *
 349      * Implementations are expected to query the system for the
 350      * current memory mode and ensure that it is what the CPU model
 351      * expects. If the check fails, the implementation should
 352      * terminate the simulation using fatal().
 353      */
 354     virtual void verifyMemoryMode() const { };
 355
 356     /**
 357      *  Number of threads we're actually simulating (<= SMT_MAX_THREADS).
 358      * This is a constant for the duration of the simulation.
 359      */
 360     ThreadID numThreads;
 361
 362     /**
 363      * Vector of per-thread instruction-based event queues.  Used for
 364      * scheduling events based on number of instructions committed by
 365      * a particular thread.
 366      */
 367     EventQueue **comInstEventQueue;
 368
 369     /**
 370      * Vector of per-thread load-based event queues.  Used for
 371      * scheduling events based on number of loads committed by
 372      *a particular thread.
 373      */
 374     EventQueue **comLoadEventQueue;
 375
 376     System *system;
 377
 378     /**
 379      * Get the cache line size of the system.
 380      */
 381     inline unsigned int cacheLineSize() const { return _cacheLineSize; }
 382
 383     /**
 384      * Serialize this object to the given output stream.
 385      *
 386      * @note CPU models should normally overload the serializeThread()
 387      * method instead of the serialize() method as this provides a
 388      * uniform data format for all CPU models and promotes better code
 389      * reuse.
 390      *
 391      * @param os The stream to serialize to.
 392      */
 393     void serialize(CheckpointOut &cp) const M5_ATTR_OVERRIDE;
 394
 395     /**
 396      * Reconstruct the state of this object from a checkpoint.
 397      *
 398      * @note CPU models should normally overload the
 399      * unserializeThread() method instead of the unserialize() method
 400      * as this provides a uniform data format for all CPU models and
 401      * promotes better code reuse.
 402
 403      * @param cp The checkpoint use.
 404      * @param section The section name of this object.
 405      */
 406     void unserialize(CheckpointIn &cp) M5_ATTR_OVERRIDE;
 407
 408     /**
 409      * Serialize a single thread.
 410      *
 411      * @param os The stream to serialize to.
 412      * @param tid ID of the current thread.
 413      */
 414     virtual void serializeThread(CheckpointOut &cp, ThreadID tid) const {};
 415
 416     /**
 417      * Unserialize one thread.
 418      *
 419      * @param cp The checkpoint use.
 420      * @param section The section name of this thread.
 421      * @param tid ID of the current thread.
 422      */
 423     virtual void unserializeThread(CheckpointIn &cp, ThreadID tid) {};
 424
 425     virtual Counter totalInsts() const = 0;
 426
 427     virtual Counter totalOps() const = 0;
 428
 429     /**
 430      * Schedule an event that exits the simulation loops after a
 431      * predefined number of instructions.
 432      *
 433      * This method is usually called from the configuration script to
 434      * get an exit event some time in the future. It is typically used
 435      * when the script wants to simulate for a specific number of
 436      * instructions rather than ticks.
 437      *
 438      * @param tid Thread monitor.
 439      * @param insts Number of instructions into the future.
 440      * @param cause Cause to signal in the exit event.
 441      */
 442     void scheduleInstStop(ThreadID tid, Counter insts, const char *cause);
 443
 444     /**
 445      * Schedule an event that exits the simulation loops after a
 446      * predefined number of load operations.
 447      *
 448      * This method is usually called from the configuration script to
 449      * get an exit event some time in the future. It is typically used
 450      * when the script wants to simulate for a specific number of
 451      * loads rather than ticks.
 452      *
 453      * @param tid Thread monitor.
 454      * @param loads Number of load instructions into the future.
 455      * @param cause Cause to signal in the exit event.
 456      */
 457     void scheduleLoadStop(ThreadID tid, Counter loads, const char *cause);
 458
 459   public:
 460     /**
 461      * @{
 462      * @name PMU Probe points.
 463      */
 464
 465     /**
 466      * Helper method to trigger PMU probes for a committed
 467      * instruction.
 468      *
 469      * @param inst Instruction that just committed
 470      */
 471     virtual void probeInstCommit(const StaticInstPtr &inst);
 472
 473     /**
 474      * Helper method to instantiate probe points belonging to this
 475      * object.
 476      *
 477      * @param name Name of the probe point.
 478      * @return A unique_ptr to the new probe point.
 479      */
 480     ProbePoints::PMUUPtr pmuProbePoint(const char *name);
 481
 482     /** CPU cycle counter */
 483     ProbePoints::PMUUPtr ppCycles;
 484
 485     /**
 486      * Instruction commit probe point.
 487      *
 488      * This probe point is triggered whenever one or more instructions
 489      * are committed. It is normally triggered once for every
 490      * instruction. However, CPU models committing bundles of
 491      * instructions may call notify once for the entire bundle.
 492      */
 493     ProbePoints::PMUUPtr ppRetiredInsts;
 494
 495     /** Retired load instructions */
 496     ProbePoints::PMUUPtr ppRetiredLoads;
 497     /** Retired store instructions */
 498     ProbePoints::PMUUPtr ppRetiredStores;
 499
 500     /** Retired branches (any type) */
 501     ProbePoints::PMUUPtr ppRetiredBranches;
 502
 503     /** @} */
 504
 505
 506
 507     // Function tracing
 508   private:
 509     bool functionTracingEnabled;
 510     std::ostream *functionTraceStream;
 511     Addr currentFunctionStart;
 512     Addr currentFunctionEnd;
 513     Tick functionEntryTick;
 514     void enableFunctionTrace();
 515     void traceFunctionsInternal(Addr pc);
 516
 517   private:
 518     static std::vector<BaseCPU *> cpuList;   //!< Static global cpu list
 519
 520   public:
 521     void traceFunctions(Addr pc)
 522     {
 523         if (functionTracingEnabled)
 524             traceFunctionsInternal(pc);
 525     }
 526
 527     static int numSimulatedCPUs() { return cpuList.size(); }
 528     static Counter numSimulatedInsts()
 529     {
 530         Counter total = 0;
 531
 532         int size = cpuList.size();
 533         for (int i = 0; i < size; ++i)
 534             total += cpuList[i]->totalInsts();
 535
 536         return total;
 537     }
 538
 539     static Counter numSimulatedOps()
 540     {
 541         Counter total = 0;
 542
 543         int size = cpuList.size();
 544         for (int i = 0; i < size; ++i)
 545             total += cpuList[i]->totalOps();
 546
 547         return total;
 548     }
 549
 550   public:
 551     // Number of CPU cycles simulated
 552     Stats::Scalar numCycles;
 553     Stats::Scalar numWorkItemsStarted;
 554     Stats::Scalar numWorkItemsCompleted;
 555
 556   private:
 557     AddressMonitor addressMonitor;
 558
 559   public:
 560     void armMonitor(Addr address);
 561     bool mwait(PacketPtr pkt);
 562     void mwaitAtomic(ThreadContext *tc, TheISA::TLB *dtb);
 563     AddressMonitor *getCpuAddrMonitor() { return &addressMonitor; }
 564     void atomicNotify(Addr address);
 565 };
 566
 567 #endif // THE_ISA == NULL_ISA
 568
 569 #endif // __CPU_BASE_HH__