kvm: Add experimental support for a perf-based execution timer
author Andreas Sandberg <Andreas.Sandberg@ARM.com>
Mon, 22 Apr 2013 17:20:32 +0000 (13:20 -0400)
committer Andreas Sandberg <Andreas.Sandberg@ARM.com>
Mon, 22 Apr 2013 17:20:32 +0000 (13:20 -0400)
Add support for using the CPU cycle counter instead of a normal POSIX
timer to generate timed exits to gem5. This should, in theory, provide
better resolution when requesting timer signals.

The perf-based timer requires a fairly recent kernel since it requires
a working PERF_EVENT_IOC_PERIOD ioctl. This ioctl has existed in the
kernel for a long time, but it used to be completely broken due to an
inverted check when the kernel copied things from user
space. Additionally, the ioctl does not change the sample period
correctly on all kernel versions which implement it. It is currently
only known to work reliably on kernel version 3.7 and above on ARM.

src/cpu/kvm/BaseKvmCPU.py
src/cpu/kvm/base.cc
src/cpu/kvm/base.hh
src/cpu/kvm/perfevent.hh
src/cpu/kvm/timer.cc
src/cpu/kvm/timer.hh

index aa7ad4c2c49ade18b7b58c08c2ceeea93ce3d3a3..a8356ac5b9c49681793311fe156ef5da3d775958 100644 (file)
@@ -69,4 +69,5 @@ class BaseKvmCPU(BaseCPU):
         return True
 
     kvmVM = Param.KvmVM(Parent.any, 'KVM VM (i.e., shared memory domain)')
+    usePerfOverflow = Param.Bool(False, "Use perf event overflow counters (EXPERIMENTAL)")
     hostFactor = Param.Float(1.0, "Cycle scale factor")
index 89f5e0f5d5715274e0315b58990227533acc5272..2d993cf35f4498adb2ac2004396e857b66e072a9 100644 (file)
@@ -78,6 +78,7 @@ BaseKvmCPU::BaseKvmCPU(BaseKvmCPUParams *params)
       _kvmRun(NULL), mmioRing(NULL),
       pageSize(sysconf(_SC_PAGE_SIZE)),
       tickEvent(*this),
+      perfControlledByTimer(params->usePerfOverflow),
       hostFactor(params->hostFactor)
 {
     if (pageSize == -1)
@@ -93,9 +94,15 @@ BaseKvmCPU::BaseKvmCPU(BaseKvmCPUParams *params)
     setupCounters();
     setupSignalHandler();
 
-    runTimer.reset(new PosixKvmTimer(KVM_TIMER_SIGNAL, CLOCK_MONOTONIC,
-                                     params->hostFactor,
-                                     params->clock));
+    if (params->usePerfOverflow)
+        runTimer.reset(new PerfKvmTimer(hwCycles,
+                                        KVM_TIMER_SIGNAL,
+                                        params->hostFactor,
+                                        params->clock));
+    else
+        runTimer.reset(new PosixKvmTimer(KVM_TIMER_SIGNAL, CLOCK_MONOTONIC,
+                                         params->hostFactor,
+                                         params->clock));
 }
 
 BaseKvmCPU::~BaseKvmCPU()
@@ -450,15 +457,25 @@ BaseKvmCPU::kvmRun(Tick ticks)
 
     DPRINTF(KvmRun, "KVM: Executing for %i ticks\n", ticks);
     timerOverflowed = false;
+
+    // Arm the run timer and start the cycle timer if it isn't
+    // controlled by the overflow timer. Starting/stopping the cycle
+    // timer automatically starts the other perf timers as they are in
+    // the same counter group.
     runTimer->arm(ticks);
-    startCounters();
+    if (!perfControlledByTimer)
+        hwCycles.start();
+
     if (ioctl(KVM_RUN) == -1) {
         if (errno != EINTR)
             panic("KVM: Failed to start virtual CPU (errno: %i)\n",
                   errno);
     }
-    stopCounters();
+
     runTimer->disarm();
+    if (!perfControlledByTimer)
+        hwCycles.stop();
+
 
     uint64_t cyclesExecuted(hwCycles.read() - baseCycles);
     Tick ticksExecuted(runTimer->ticksFromHostCycles(cyclesExecuted));
@@ -821,6 +838,17 @@ BaseKvmCPU::setupCounters()
                                 PERF_COUNT_HW_CPU_CYCLES);
     cfgCycles.disabled(true)
         .pinned(true);
+
+    if (perfControlledByTimer) {
+        // We need to configure the cycles counter to send overflows
+        // since we are going to use it to trigger timer signals that
+        // trap back into m5 from KVM. In practice, this means that we
+        // need to set some non-zero sample period that gets
+        // overridden when the timer is armed.
+        cfgCycles.wakeupEvents(1)
+            .samplePeriod(42);
+    }
+
     hwCycles.attach(cfgCycles,
                     0); // TID (0 => currentThread)
 
@@ -831,18 +859,3 @@ BaseKvmCPU::setupCounters()
                           0, // TID (0 => currentThread)
                           hwCycles);
 }
-
-void
-BaseKvmCPU::startCounters()
-{
-    // We only need to start/stop the hwCycles counter since hwCycles
-    // and hwInstructions are a counter group with hwCycles as the
-    // group leader.
-    hwCycles.start();
-}
-
-void
-BaseKvmCPU::stopCounters()
-{
-    hwCycles.stop();
-}
index 90ebae64468be2b49c46662154f666680fd8d6f2..0554f913e83c1c1b85f5bba8871a70b43079cf4d 100644 (file)
@@ -460,12 +460,6 @@ class BaseKvmCPU : public BaseCPU
     /** Setup hardware performance counters */
     void setupCounters();
 
-    /** @{ */
-    /** Start/stop counting HW performance events */
-    void startCounters();
-    void stopCounters();
-    /** @} */
-
     /** KVM vCPU file descriptor */
     int vcpuFD;
     /** Size of MMAPed kvm_run area */
@@ -495,6 +489,15 @@ class BaseKvmCPU : public BaseCPU
     PerfKvmCounter hwInstructions;
     /** @} */
 
+    /**
+     * Does the runTimer control the performance counters?
+     *
+     * The run timer will automatically enable and disable performance
+     * counters if a PerfEvent-based timer is used to control KVM
+     * exits.
+     */
+    bool perfControlledByTimer;
+
     /**
      * Timer used to force execution into the monitor after a
      * specified number of simulation tick equivalents have executed
index 8242cc071d42aa0ca18f9b61c1f9b52000eec41d..eed900994a3db0c14f8cba0c58cd529bb3889a8b 100644 (file)
@@ -217,7 +217,8 @@ public:
      * like the new period isn't effective until after the next
      * counter overflow. If you use this method to change the sample
      * period, you will see one sample with the old period and then
-     * start sampling with the new period.
+     * start sampling with the new period. This problem was fixed for
+     * ARM in version 3.7 of the kernel.
      *
      * @warning This method doesn't work at all on some 2.6.3x kernels
      * since it has inverted check for the return value when copying
index 059d70f6bc9be29465073c012b5a237eebb393cb..e1f74a552e2eddcc50d672931961c3ffb0241633 100644 (file)
@@ -110,3 +110,37 @@ PosixKvmTimer::calcResolution()
 
     return resolution;
 }
+
+
+PerfKvmTimer::PerfKvmTimer(PerfKvmCounter &ctr,
+                           int signo, float hostFactor, Tick hostFreq)
+    : BaseKvmTimer(signo, hostFactor, hostFreq),
+      hwOverflow(ctr) // reference to the caller's counter, not a copy
+{
+    hwOverflow.enableSignals(signo); // presumably: overflow raises signo
+}
+
+PerfKvmTimer::~PerfKvmTimer()
+{ // Intentionally empty: the only member is a reference to the counter.
+}
+
+void
+PerfKvmTimer::arm(Tick ticks)
+{
+    hwOverflow.period(hostCycles(ticks)); // new sample (overflow) period
+    hwOverflow.refresh(1); // presumably (re)enables counting; TODO confirm
+}
+
+void
+PerfKvmTimer::disarm()
+{
+    hwOverflow.stop(); // stops the counter this timer was constructed with
+}
+
+Tick
+PerfKvmTimer::calcResolution()
+{
+    // This is a bit arbitrary, but in practice, we can't really do
+    // anything useful in less than ~1000 host cycles anyway.
+    return ticksFromHostCycles(1000);
+}
index a5105e7faa423cdf5d0322c13ac8be802bc6874c..df60b7227b1b1dddd40d435e74596695aae98e16 100644 (file)
@@ -42,6 +42,7 @@
 
 #include <ctime>
 
+#include "cpu/kvm/perfevent.hh"
 #include "sim/core.hh"
 
 /**
@@ -203,4 +204,44 @@ class PosixKvmTimer : public BaseKvmTimer
     timer_t timer;
 };
 
+/**
+ * PerfEvent based timer using the host's CPU cycle counter.
+ *
+ * @warning There is a known problem in some versions of the PerfEvent
+ * API that prevents the counter overflow period from being updated
+ * reliably, which might break this timer. See PerfKvmCounter::period()
+ * for details.
+ */
+class PerfKvmTimer : public BaseKvmTimer
+{
+  public:
+    /**
+     * Create a timer that uses an existing hardware cycle counter.
+     *
+     * @note The performance counter must be configured for overflow
+     * sampling, which in practice means that it must have a non-zero
+     * sample period. The initial sample period is ignored since the
+     * period is updated whenever arm() is called.
+     *
+     * @param ctr Attached performance counter configured for overflow
+     *            reporting.
+     * @param signo Signal to deliver
+     * @param hostFactor Performance scaling factor
+     * @param hostFreq Clock frequency of the host
+     */
+    PerfKvmTimer(PerfKvmCounter &ctr,
+                 int signo,
+                 float hostFactor, Tick hostFreq);
+    ~PerfKvmTimer();
+
+    void arm(Tick ticks);
+    void disarm();
+
+  protected:
+    Tick calcResolution();
+
+  private:
+    PerfKvmCounter &hwOverflow; // not owned; must outlive this timer
+};
+
 #endif