ruby: patch checkpoint restore with garnet

author Nilay Vaish <nilay@cs.wisc.edu>

Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)

committer Nilay Vaish <nilay@cs.wisc.edu>

Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)
author Nilay Vaish <nilay@cs.wisc.edu>
Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)
committer Nilay Vaish <nilay@cs.wisc.edu>
Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)
diff --git a/src/mem/ruby/common/Global.cc b/src/mem/ruby/common/Global.cc

index 407e373075cd8a2c00eb79457e5064baea3c666b..3fdbd28b63a2a66b25ad36e7c7d0a25c7330bfa6 100644 (file)
--- a/src/mem/ruby/common/Global.cc
+++ b/src/mem/ruby/common/Global.cc
@@ -32,3 +32,4 @@ using namespace std;
  
  RubySystem* g_system_ptr = 0;
  vector<map<uint32_t, AbstractController *> > g_abs_controls;
+Cycles g_ruby_start;
diff --git a/src/mem/ruby/common/Global.hh b/src/mem/ruby/common/Global.hh

index 671f423f011040dc347e7a827d95733f4f8034ae..8282f5b015ac88a157abfc30c4e6f4496688c513 100644 (file)
--- a/src/mem/ruby/common/Global.hh
+++ b/src/mem/ruby/common/Global.hh
@@ -33,6 +33,7 @@
  #include <vector>
  
  #include "base/str.hh"
+#include "base/types.hh"
  
  class RubySystem;
  extern RubySystem* g_system_ptr;
@@ -40,5 +41,9 @@ extern RubySystem* g_system_ptr;
  class AbstractController;
  extern std::vector<std::map<uint32_t, AbstractController *> > g_abs_controls;
  
+// A globally visible time at which the actual execution started. Meant only
+// for components with in Ruby. Initialized in RubySystem::startup().
+extern Cycles g_ruby_start;
+
  #endif // __MEM_RUBY_COMMON_GLOBAL_HH__
  
diff --git a/src/mem/ruby/network/garnet/BaseGarnetNetwork.cc b/src/mem/ruby/network/garnet/BaseGarnetNetwork.cc

index 3b24ada4969f724c5d13d20a65fc4d14ed3d76cc..3e70900dc88debf62bbd76715b08bd7f6c6c48c4 100644 (file)
--- a/src/mem/ruby/network/garnet/BaseGarnetNetwork.cc
+++ b/src/mem/ruby/network/garnet/BaseGarnetNetwork.cc
@@ -36,7 +36,7 @@
  using namespace std;
  
  BaseGarnetNetwork::BaseGarnetNetwork(const Params *p)
-    : Network(p), m_ruby_start(0)
+    : Network(p)
  {
      m_ni_flit_size = p->ni_flit_size;
      m_vcs_per_vnet = p->vcs_per_vnet;
@@ -123,13 +123,6 @@ BaseGarnetNetwork::getFromNetQueue(NodeID id, bool ordered, int network_num,
  void
  BaseGarnetNetwork::clearStats()
  {
-    m_ruby_start = curCycle();
-}
-
-Cycles
-BaseGarnetNetwork::getRubyStartTime()
-{
-    return m_ruby_start;
  }
  
  void
diff --git a/src/mem/ruby/network/garnet/BaseGarnetNetwork.hh b/src/mem/ruby/network/garnet/BaseGarnetNetwork.hh

index 15e63925a25206b7b0a04ee15138e2136b3e12d9..b9f86df59bc91ce96fd1eda2fb3c32c3db93d885 100644 (file)
--- a/src/mem/ruby/network/garnet/BaseGarnetNetwork.hh
+++ b/src/mem/ruby/network/garnet/BaseGarnetNetwork.hh
@@ -80,7 +80,6 @@ class BaseGarnetNetwork : public Network
      virtual void checkNetworkAllocation(NodeID id, bool ordered,
          int network_num, std::string vnet_type) = 0;
  
-    Cycles getRubyStartTime();
      void clearStats();
      void printStats(std::ostream& out) const;
      void printPerformanceStats(std::ostream& out) const;
@@ -102,8 +101,6 @@ class BaseGarnetNetwork : public Network
  
      std::vector<std::vector<MessageBuffer*> > m_toNetQueues;
      std::vector<std::vector<MessageBuffer*> > m_fromNetQueues;
-
-    Cycles m_ruby_start;
  };
  
  #endif // __MEM_RUBY_NETWORK_GARNET_BASEGARNETNETWORK_HH__
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/GarnetNetwork_d.cc b/src/mem/ruby/network/garnet/fixed-pipeline/GarnetNetwork_d.cc

index c4965af17a7f21410c37f374409a487bb638598e..4b1e0d0d785f1b5831bf3267b602b5b71beaa066 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/GarnetNetwork_d.cc
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/GarnetNetwork_d.cc
@@ -270,7 +270,7 @@ GarnetNetwork_d::printLinkStats(ostream& out) const
      for (int i = 0; i < m_link_ptr_vector.size(); i++) {
          average_link_utilization +=
              (double(m_link_ptr_vector[i]->getLinkUtilization())) /
-            (double(curCycle() - m_ruby_start));
+            (double(curCycle() - g_ruby_start));
  
          vector<int> vc_load = m_link_ptr_vector[i]->getVcLoad();
          for (int j = 0; j < vc_load.size(); j++) {
@@ -289,7 +289,7 @@ GarnetNetwork_d::printLinkStats(ostream& out) const
              continue;
  
          average_vc_load[i] = (double(average_vc_load[i])) /
-            (double(curCycle() - m_ruby_start));
+            (double(curCycle() - g_ruby_start));
          out << "Average VC Load [" << i << "] = " << average_vc_load[i]
              << " flits/cycle " << endl;
      }
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/InputUnit_d.cc b/src/mem/ruby/network/garnet/fixed-pipeline/InputUnit_d.cc

index 7db9db56b02d77c0a23f853040d273e4ee7a4c55..82d89912e3c97b712f7a5eb7bad0ff5e09076de3 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/InputUnit_d.cc
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/InputUnit_d.cc
@@ -53,7 +53,7 @@ InputUnit_d::InputUnit_d(int id, Router_d *router) : Consumer(router)
      // Instantiating the virtual channels
      m_vcs.resize(m_num_vcs);
      for (int i=0; i < m_num_vcs; i++) {
-        m_vcs[i] = new VirtualChannel_d(i, m_router->curCycle());
+        m_vcs[i] = new VirtualChannel_d(i);
      }
  }
  
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/NetworkInterface_d.cc b/src/mem/ruby/network/garnet/fixed-pipeline/NetworkInterface_d.cc

index e49216476147cf0ffdde6e49f646aae4cb1f4a81..adf1c1a4dc4eb02367a4b2a12506a3d2e3d28025 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/NetworkInterface_d.cc
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/NetworkInterface_d.cc
@@ -71,7 +71,6 @@ NetworkInterface_d::NetworkInterface_d(int id, int virtual_networks,
  
      for (int i = 0; i < m_num_vcs; i++) {
          m_out_vc_state.push_back(new OutVcState_d(i, m_net_ptr));
-        m_out_vc_state[i]->setState(IDLE_, m_net_ptr->curCycle());
      }
  }
  
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.cc b/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.cc

index d006591c0faa445ffc5475945759d4cc5520dcce..a11bf0c2dcf16f5cb78f82f22f96a93dc8e5d248 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.cc
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.cc
@@ -33,16 +33,15 @@
  #include "mem/ruby/system/System.hh"
  
  OutVcState_d::OutVcState_d(int id, GarnetNetwork_d *network_ptr)
+    : m_time(0)
  {
-    m_network_ptr = network_ptr;
      m_id = id;
      m_vc_state = IDLE_;
-    m_time = m_network_ptr->curCycle();
  
-    if (m_network_ptr->get_vnet_type(id) == DATA_VNET_)
-        m_credit_count = m_network_ptr->getBuffersPerDataVC();
+    if (network_ptr->get_vnet_type(id) == DATA_VNET_)
+        m_credit_count = network_ptr->getBuffersPerDataVC();
      else
-        m_credit_count = m_network_ptr->getBuffersPerCtrlVC();
+        m_credit_count = network_ptr->getBuffersPerCtrlVC();
  
      assert(m_credit_count >= 1);
  }
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.hh b/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.hh

index 07b197cf59d9fffca704e0a8612cd16e253d3efc..08ceecec0115e2bf15b57966a8ea2156138203e7 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.hh
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.hh
@@ -61,7 +61,6 @@ class OutVcState_d
      inline void decrement_credit()  { m_credit_count--; }
  
    private:
-    GarnetNetwork_d *m_network_ptr;
      int m_id ;
      Cycles m_time;
      VC_state_type m_vc_state;
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.cc b/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.cc

index bfeecbc25e0e4ba393618786b9f72003075e05be..510a79e8dc14b7420a985a083ee2b0a8b4a68d99 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.cc
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.cc
@@ -30,13 +30,13 @@
  
  #include "mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh"
  
-VirtualChannel_d::VirtualChannel_d(int id, Cycles curTime)
+VirtualChannel_d::VirtualChannel_d(int id)
      : m_enqueue_time(INFINITE_)
  {
      m_id = id;
      m_input_buffer = new flitBuffer_d();
      m_vc_state.first = IDLE_;
-    m_vc_state.second = curTime;
+    m_vc_state.second = Cycles(0);
  }
  
  VirtualChannel_d::~VirtualChannel_d()
diff --git a/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh b/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh

index 9e8b95d9d0b8625eb2ccda0cf0a059ffd9217799..d196303053ea6aeb7ed466825f46f8350ba578fc 100644 (file)
--- a/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh
+++ b/src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh
@@ -39,7 +39,7 @@
  class VirtualChannel_d
  {
    public:
-    VirtualChannel_d(int id, Cycles curTime);
+    VirtualChannel_d(int id);
      ~VirtualChannel_d();
  
      bool need_stage(VC_state_type state, flit_stage stage, Cycles curTime);
diff --git a/src/mem/ruby/network/garnet/flexible-pipeline/GarnetNetwork.cc b/src/mem/ruby/network/garnet/flexible-pipeline/GarnetNetwork.cc

index ed75a26d1221d8865b25f79fea1d16a7dad4d48a..ee54dc2c5ce9844f4eb47277c490a2641b0a1fb0 100644 (file)
--- a/src/mem/ruby/network/garnet/flexible-pipeline/GarnetNetwork.cc
+++ b/src/mem/ruby/network/garnet/flexible-pipeline/GarnetNetwork.cc
@@ -254,7 +254,7 @@ GarnetNetwork::printLinkStats(ostream& out) const
      for (int i = 0; i < m_link_ptr_vector.size(); i++) {
          average_link_utilization +=
              (double(m_link_ptr_vector[i]->getLinkUtilization())) /
-            (double(curCycle() - m_ruby_start));
+            (double(curCycle() - g_ruby_start));
  
          vector<int> vc_load = m_link_ptr_vector[i]->getVcLoad();
          for (int j = 0; j < vc_load.size(); j++) {
@@ -273,7 +273,7 @@ GarnetNetwork::printLinkStats(ostream& out) const
              continue;
  
          average_vc_load[i] = double(average_vc_load[i]) /
-            (double(curCycle() - m_ruby_start));
+            (double(curCycle() - g_ruby_start));
          out << "Average VC Load [" << i << "] = " << average_vc_load[i]
              << " flits/cycle " << endl;
      }
diff --git a/src/mem/ruby/network/garnet/flexible-pipeline/NetworkInterface.cc b/src/mem/ruby/network/garnet/flexible-pipeline/NetworkInterface.cc

index 870560af0fa5da1a331fdfcae63b540789286393..09e0685571275e4af364d72548d6feadf0df61b6 100644 (file)
--- a/src/mem/ruby/network/garnet/flexible-pipeline/NetworkInterface.cc
+++ b/src/mem/ruby/network/garnet/flexible-pipeline/NetworkInterface.cc
@@ -68,7 +68,6 @@ NetworkInterface::NetworkInterface(int id, int virtual_networks,
  
      for (int i = 0; i < m_num_vcs; i++) {
          m_out_vc_state.push_back(new OutVcState(i));
-        m_out_vc_state[i]->setState(IDLE_, m_net_ptr->curCycle());
      }
  }
  
diff --git a/src/mem/ruby/network/garnet/flexible-pipeline/OutVcState.cc b/src/mem/ruby/network/garnet/flexible-pipeline/OutVcState.cc

index e08f7f93afad17d93d8b9d563d1bf87cafcd6c58..114baa5cd968b64b61a8e52b63e2e00407ea9268 100644 (file)
--- a/src/mem/ruby/network/garnet/flexible-pipeline/OutVcState.cc
+++ b/src/mem/ruby/network/garnet/flexible-pipeline/OutVcState.cc
@@ -31,6 +31,7 @@
  #include "mem/ruby/network/garnet/flexible-pipeline/OutVcState.hh"
  
  OutVcState::OutVcState(int id)
+    : m_time(0)
  {
      m_id = id;
      m_vc_state = IDLE_;
diff --git a/src/mem/ruby/network/orion/NetworkPower.cc b/src/mem/ruby/network/orion/NetworkPower.cc

index 6d4fc19234fa8f1f9d11b3d2ab71dd85d69f435b..c58d64a17c7b21c107a688636e1a15dedbfab787 100644 (file)
--- a/src/mem/ruby/network/orion/NetworkPower.cc
+++ b/src/mem/ruby/network/orion/NetworkPower.cc
@@ -39,7 +39,7 @@ Router_d::calculate_power()
  {
      //Network Activities from garnet
      calculate_performance_numbers();
-    double sim_cycles = curCycle() - m_network_ptr->getRubyStartTime();
+    double sim_cycles = curCycle() - g_ruby_start;
  
      // Number of virtual networks/message classes declared in Ruby
      // maybe greater than active virtual networks.
@@ -245,8 +245,7 @@ NetworkLink_d::calculate_power()
          channel_width_bits,
          orion_cfg_ptr);
  
-    double sim_cycles =
-        (double)(m_net_ptr->curCycle() - m_net_ptr->getRubyStartTime());
+    double sim_cycles = (double)(m_net_ptr->curCycle() - g_ruby_start);
  
      // Dynamic Power
      // Assume half the bits flipped on every link activity
diff --git a/src/mem/ruby/profiler/Profiler.cc b/src/mem/ruby/profiler/Profiler.cc

index 4d05a5698d7b3c92a8f94adb834f595b8c42b631..e9c2aed2985630fec1bdf77eadcd987ca0c02948 100644 (file)
--- a/src/mem/ruby/profiler/Profiler.cc
+++ b/src/mem/ruby/profiler/Profiler.cc
@@ -515,11 +515,7 @@ Profiler::clearStats()
  
      m_cycles_executed_at_start.resize(m_num_of_sequencers);
      for (int i = 0; i < m_num_of_sequencers; i++) {
-        if (g_system_ptr == NULL) {
-            m_cycles_executed_at_start[i] = 0;
-        } else {
-            m_cycles_executed_at_start[i] = g_system_ptr->curCycle();
-        }
+        m_cycles_executed_at_start[i] = g_system_ptr->curCycle();
      }
  
      m_busyBankCount = 0;
diff --git a/src/mem/ruby/system/System.cc b/src/mem/ruby/system/System.cc

index 617788b9968dff368d03f0f0b98da6d7d82e5619..357511127f69ea3441e1be26170592b6317200e8 100644 (file)
--- a/src/mem/ruby/system/System.cc
+++ b/src/mem/ruby/system/System.cc
@@ -93,13 +93,6 @@ RubySystem::RubySystem(const Params *p)
      g_abs_controls.resize(MachineType_NUM);
  }
  
-void
-RubySystem::init()
-{
-    m_profiler_ptr->clearStats();
-    m_network_ptr->clearStats();
-}
-
  void
  RubySystem::registerNetwork(Network* network_ptr)
  {
@@ -311,12 +304,6 @@ RubySystem::readCompressedTrace(string filename, uint8_t *&raw_data,
  void
  RubySystem::unserialize(Checkpoint *cp, const string &section)
  {
-    //
-    // The main purpose for clearing stats in the unserialize process is so
-    // that the profiler can correctly set its start time to the unserialized
-    // value of curTick()
-    //
-    resetStats();
      uint8_t *uncompressed_trace = NULL;
  
      if (m_mem_vec_ptr != NULL) {
@@ -368,6 +355,23 @@ RubySystem::unserialize(Checkpoint *cp, const string &section)
  void
  RubySystem::startup()
  {
+
+    // Ruby restores state from a checkpoint by resetting the clock to 0 and
+    // playing the requests that can possibly re-generate the cache state.
+    // The clock value is set to the actual checkpointed value once all the
+    // requests have been executed.
+    //
+    // This way of restoring state is pretty finicky. For example, if a
+    // Ruby component reads time before the state has been restored, it would
+    // cache this value and hence its clock would not be reset to 0, when
+    // Ruby resets the global clock. This can potentially result in a
+    // deadlock.
+    //
+    // The solution is that no Ruby component should read time before the
+    // simulation starts. And then one also needs to hope that the time
+    // Ruby finishes restoring the state is less than the time when the
+    // state was checkpointed.
+
      if (m_warmup_enabled) {
          // save the current tick value
          Tick curtick_original = curTick();
@@ -397,6 +401,8 @@ RubySystem::startup()
          setCurTick(curtick_original);
          resetClock();
      }
+
+    resetStats();
  }
  
  void
@@ -417,6 +423,8 @@ RubySystem::resetStats()
      for (uint32_t cntrl = 0; cntrl < m_abs_cntrl_vec.size(); cntrl++) {
          m_abs_cntrl_vec[cntrl]->clearStats();
      }
+
+    g_ruby_start = curCycle();
  }
  
  bool
diff --git a/src/mem/ruby/system/System.hh b/src/mem/ruby/system/System.hh

index 1e0be6da7ef1b03c347f54bc8304fc90c06f9062..ea55a23e09f2bbbcbd6d722b7c77ec0fb09a8be6 100644 (file)
--- a/src/mem/ruby/system/System.hh
+++ b/src/mem/ruby/system/System.hh
@@ -134,8 +134,6 @@ class RubySystem : public ClockedObject
      RubySystem(const RubySystem& obj);
      RubySystem& operator=(const RubySystem& obj);
  
-    void init();
-
      void readCompressedTrace(std::string filename,
                               uint8_t *&raw_data,
                               uint64& uncompressed_trace_size);
author	Nilay Vaish <nilay@cs.wisc.edu>
	Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)
committer	Nilay Vaish <nilay@cs.wisc.edu>
	Tue, 23 Apr 2013 05:03:02 +0000 (00:03 -0500)
src/mem/ruby/common/Global.cc		patch \| blob \| history
src/mem/ruby/common/Global.hh		patch \| blob \| history
src/mem/ruby/network/garnet/BaseGarnetNetwork.cc		patch \| blob \| history
src/mem/ruby/network/garnet/BaseGarnetNetwork.hh		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/GarnetNetwork_d.cc		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/InputUnit_d.cc		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/NetworkInterface_d.cc		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.cc		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/OutVcState_d.hh		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.cc		patch \| blob \| history
src/mem/ruby/network/garnet/fixed-pipeline/VirtualChannel_d.hh		patch \| blob \| history
src/mem/ruby/network/garnet/flexible-pipeline/GarnetNetwork.cc		patch \| blob \| history
src/mem/ruby/network/garnet/flexible-pipeline/NetworkInterface.cc		patch \| blob \| history
src/mem/ruby/network/garnet/flexible-pipeline/OutVcState.cc		patch \| blob \| history
src/mem/ruby/network/orion/NetworkPower.cc		patch \| blob \| history
src/mem/ruby/profiler/Profiler.cc		patch \| blob \| history
src/mem/ruby/system/System.cc		patch \| blob \| history
src/mem/ruby/system/System.hh		patch \| blob \| history