mem-cache: Support for page crossing prefetches

author Javier Bueno <javier.bueno@metempsy.com>

Tue, 27 Nov 2018 15:15:53 +0000 (16:15 +0100)

committer Javier Bueno Hedo <javier.bueno@metempsy.com>

Wed, 29 May 2019 08:55:39 +0000 (08:55 +0000)
author Javier Bueno <javier.bueno@metempsy.com>
Tue, 27 Nov 2018 15:15:53 +0000 (16:15 +0100)
committer Javier Bueno Hedo <javier.bueno@metempsy.com>
Wed, 29 May 2019 08:55:39 +0000 (08:55 +0000)
diff --git a/src/mem/cache/prefetch/Prefetcher.py b/src/mem/cache/prefetch/Prefetcher.py

index 3810b6afd3d6856fa42d6fa19e9ec9d397425ff7..bf735264ae016ed038e4088b495541631d7f1f41 100644 (file)
--- a/src/mem/cache/prefetch/Prefetcher.py
+++ b/src/mem/cache/prefetch/Prefetcher.py
@@ -65,6 +65,7 @@ class BasePrefetcher(ClockedObject):
      cxx_header = "mem/cache/prefetch/base.hh"
      cxx_exports = [
          PyBindMethod("addEventProbe"),
+        PyBindMethod("addTLB"),
      ]
      sys = Param.System(Parent.any, "System this prefetcher belongs to")
  
@@ -88,6 +89,8 @@ class BasePrefetcher(ClockedObject):
      # Override the normal SimObject::regProbeListeners method and
      # register deferred event handlers.
      def regProbeListeners(self):
+        for tlb in self._tlbs:
+            self.getCCObject().addTLB(tlb.getCCObject())
          for event in self._events:
             event.register()
          self.getCCObject().regProbeListeners()
@@ -98,6 +101,11 @@ class BasePrefetcher(ClockedObject):
          if len(probeNames) <= 0:
              raise TypeError("probeNames must have at least one element")
          self.addEvent(HWPProbeEvent(self, simObj, *probeNames))
+    _tlbs = []
+    def registerTLB(self, simObj):
+        if not isinstance(simObj, SimObject):
+            raise TypeError("argument must be a SimObject type")
+        self._tlbs.append(simObj)
  
  class MultiPrefetcher(BasePrefetcher):
      type = 'MultiPrefetcher'
@@ -113,6 +121,8 @@ class QueuedPrefetcher(BasePrefetcher):
      cxx_header = "mem/cache/prefetch/queued.hh"
      latency = Param.Int(1, "Latency for generated prefetches")
      queue_size = Param.Int(32, "Maximum number of queued prefetches")
+    max_prefetch_requests_with_pending_translation = Param.Int(32,
+        "Maximum number of queued prefetches that have a missing translation")
      queue_squash = Param.Bool(True, "Squash queued prefetch on demand access")
      queue_filter = Param.Bool(True, "Don't queue redundant prefetches")
      cache_snoop = Param.Bool(False, "Snoop cache to eliminate redundant request")
diff --git a/src/mem/cache/prefetch/base.cc b/src/mem/cache/prefetch/base.cc

index 3664892276ede32f60fdbb3f61db4915cae7ac5a..b3a43cc582ecea5744316889241d9381ac3559a2 100644 (file)
--- a/src/mem/cache/prefetch/base.cc
+++ b/src/mem/cache/prefetch/base.cc
@@ -96,7 +96,7 @@ BasePrefetcher::BasePrefetcher(const BasePrefetcherParams *p)
        masterId(p->sys->getMasterId(this)), pageBytes(p->sys->getPageBytes()),
        prefetchOnAccess(p->prefetch_on_access),
        useVirtualAddresses(p->use_virtual_addresses), issuedPrefetches(0),
-      usefulPrefetches(0)
+      usefulPrefetches(0), tlb(nullptr)
  {
  }
  
@@ -254,3 +254,10 @@ BasePrefetcher::addEventProbe(SimObject *obj, const char *name)
      ProbeManager *pm(obj->getProbeManager());
      listeners.push_back(new PrefetchListener(*this, pm, name));
  }
+
+void
+BasePrefetcher::addTLB(BaseTLB *t)
+{
+    fatal_if(tlb != nullptr, "Only one TLB can be registered");
+    tlb = t;
+}
diff --git a/src/mem/cache/prefetch/base.hh b/src/mem/cache/prefetch/base.hh

index f4a61b21a34c394cc8add8029e066059edb46a24..e31dbfd4017022aa87c939a933f939dd57c0a782 100644 (file)
--- a/src/mem/cache/prefetch/base.hh
+++ b/src/mem/cache/prefetch/base.hh
@@ -52,6 +52,7 @@
  #include <cstdint>
  
  #include "arch/isa_traits.hh"
+#include "arch/generic/tlb.hh"
  #include "base/statistics.hh"
  #include "base/types.hh"
  #include "mem/packet.hh"
@@ -326,6 +327,9 @@ class BasePrefetcher : public ClockedObject
      /** Total prefetches that has been useful */
      uint64_t usefulPrefetches;
  
+    /** Registered tlb for address translations */
+    BaseTLB * tlb;
+
    public:
  
      BasePrefetcher(const BasePrefetcherParams *p);
@@ -371,5 +375,13 @@ class BasePrefetcher : public ClockedObject
       * @param name The probe name
       */
      void addEventProbe(SimObject *obj, const char *name);
+
+    /**
+     * Add a BaseTLB object to be used whenever a translation is needed.
+     * This is generally required when the prefetcher is allowed to generate
+     * page crossing references and/or uses virtual addresses for training.
+     * @param tlb pointer to the BaseTLB object to add
+     */
+    void addTLB(BaseTLB *tlb);
  };
  #endif //__MEM_CACHE_PREFETCH_BASE_HH__
diff --git a/src/mem/cache/prefetch/queued.cc b/src/mem/cache/prefetch/queued.cc

index d7b8aacd08689dc41c02d0ee04c6743395930ec2..12f4a3601137878e71f6c48817cb5d6f91fd3b18 100644 (file)
--- a/src/mem/cache/prefetch/queued.cc
+++ b/src/mem/cache/prefetch/queued.cc
@@ -41,18 +41,63 @@
  
  #include <cassert>
  
+#include "arch/generic/tlb.hh"
  #include "base/logging.hh"
  #include "base/trace.hh"
  #include "debug/HWPrefetch.hh"
+#include "mem/cache/base.hh"
  #include "mem/request.hh"
  #include "params/QueuedPrefetcher.hh"
  
-QueuedPrefetcher::QueuedPrefetcher(const QueuedPrefetcherParams *p)
-    : BasePrefetcher(p), queueSize(p->queue_size), latency(p->latency),
-      queueSquash(p->queue_squash), queueFilter(p->queue_filter),
-      cacheSnoop(p->cache_snoop), tagPrefetch(p->tag_prefetch)
+void
+QueuedPrefetcher::DeferredPacket::createPkt(Addr paddr, unsigned blk_size,
+                                            MasterID mid, bool tag_prefetch,
+                                            Tick t) {
+    /* Create a prefetch memory request */
+    RequestPtr req = std::make_shared<Request>(paddr, blk_size, 0, mid);
+
+    if (pfInfo.isSecure()) {
+        req->setFlags(Request::SECURE);
+    }
+    req->taskId(ContextSwitchTaskId::Prefetcher);
+    pkt = new Packet(req, MemCmd::HardPFReq);
+    pkt->allocate();
+    if (tag_prefetch && pfInfo.hasPC()) {
+        // Tag prefetch packet with  accessing pc
+        pkt->req->setPC(pfInfo.getPC());
+    }
+    tick = t;
+}
+
+void
+QueuedPrefetcher::DeferredPacket::startTranslation(BaseTLB *tlb)
  {
+    assert(translationRequest != nullptr);
+    if (!ongoingTranslation) {
+        ongoingTranslation = true;
+        // Prefetchers only operate in Timing mode
+        tlb->translateTiming(translationRequest, tc, this, BaseTLB::Read);
+    }
+}
  
+void
+QueuedPrefetcher::DeferredPacket::finish(const Fault &fault,
+    const RequestPtr &req, ThreadContext *tc, BaseTLB::Mode mode)
+{
+    assert(ongoingTranslation);
+    ongoingTranslation = false;
+    bool failed = (fault != NoFault);
+    owner->translationComplete(this, failed);
+}
+
+QueuedPrefetcher::QueuedPrefetcher(const QueuedPrefetcherParams *p)
+    : BasePrefetcher(p), queueSize(p->queue_size),
+      missingTranslationQueueSize(
+        p->max_prefetch_requests_with_pending_translation),
+      latency(p->latency), queueSquash(p->queue_squash),
+      queueFilter(p->queue_filter), cacheSnoop(p->cache_snoop),
+      tagPrefetch(p->tag_prefetch)
+{
  }
  
  QueuedPrefetcher::~QueuedPrefetcher()
@@ -93,18 +138,19 @@ QueuedPrefetcher::notify(const PacketPtr &pkt, const PrefetchInfo &pfi)
          // Block align prefetch address
          addr_prio.first = blockAddress(addr_prio.first);
  
-        if (samePage(pfi.getAddr(), addr_prio.first)) {
-            PrefetchInfo new_pfi(pfi,addr_prio.first);
+        if (!samePage(addr_prio.first, pfi.getAddr())) {
+            pfSpanPage += 1;
+        }
  
+        bool can_cross_page = (tlb != nullptr);
+        if (can_cross_page || samePage(addr_prio.first, pfi.getAddr())) {
+            PrefetchInfo new_pfi(pfi,addr_prio.first);
              pfIdentified++;
              DPRINTF(HWPrefetch, "Found a pf candidate addr: %#x, "
                      "inserting into prefetch queue.\n", new_pfi.getAddr());
-
              // Create and insert the request
              insert(pkt, new_pfi, addr_prio.second);
          } else {
-            // Record the number of page crossing prefetches generate
-            pfSpanPage += 1;
              DPRINTF(HWPrefetch, "Ignoring page crossing prefetch.\n");
          }
      }
@@ -115,6 +161,12 @@ QueuedPrefetcher::getPacket()
  {
      DPRINTF(HWPrefetch, "Requesting a prefetch to issue.\n");
  
+    if (pfq.empty()) {
+        // If the queue is empty, attempt first to fill it with requests
+        // from the queue of missing translations
+        processMissingTranslations(queueSize);
+    }
+
      if (pfq.empty()) {
          DPRINTF(HWPrefetch, "No hardware prefetches available.\n");
          return nullptr;
@@ -127,27 +179,9 @@ QueuedPrefetcher::getPacket()
      issuedPrefetches += 1;
      assert(pkt != nullptr);
      DPRINTF(HWPrefetch, "Generating prefetch for %#x.\n", pkt->getAddr());
-    return pkt;
-}
  
-QueuedPrefetcher::const_iterator
-QueuedPrefetcher::inPrefetch(const PrefetchInfo &pfi) const
-{
-    for (const_iterator dp = pfq.begin(); dp != pfq.end(); dp++) {
-        if (dp->pfInfo.sameAddr(pfi)) return dp;
-    }
-
-    return pfq.end();
-}
-
-QueuedPrefetcher::iterator
-QueuedPrefetcher::inPrefetch(const PrefetchInfo &pfi)
-{
-    for (iterator dp = pfq.begin(); dp != pfq.end(); dp++) {
-        if (dp->pfInfo.sameAddr(pfi)) return dp;
-    }
-
-    return pfq.end();
+    processMissingTranslations(queueSize - pfq.size());
+    return pkt;
  }
  
  void
@@ -173,7 +207,106 @@ QueuedPrefetcher::regStats()
  
      pfSpanPage
          .name(name() + ".pfSpanPage")
-        .desc("number of prefetches not generated due to page crossing");
+        .desc("number of prefetches that crossed the page");
+}
+
+
+void
+QueuedPrefetcher::processMissingTranslations(unsigned max)
+{
+    unsigned count = 0;
+    iterator it = pfqMissingTranslation.begin();
+    while (it != pfqMissingTranslation.end() && count < max) {
+        DeferredPacket &dp = *it;
+        // Increase the iterator first because dp.startTranslation can end up
+        // calling finishTranslation, which will erase "it"
+        it++;
+        dp.startTranslation(tlb);
+        count += 1;
+    }
+}
+
+void
+QueuedPrefetcher::translationComplete(DeferredPacket *dp, bool failed)
+{
+    auto it = pfqMissingTranslation.begin();
+    while (it != pfqMissingTranslation.end()) {
+        if (&(*it) == dp) {
+            break;
+        }
+        it++;
+    }
+    assert(it != pfqMissingTranslation.end());
+    if (!failed) {
+        DPRINTF(HWPrefetch, "%s Translation of vaddr %#x succeeded: "
+                "paddr %#x \n", tlb->name(),
+                it->translationRequest->getVaddr(),
+                it->translationRequest->getPaddr());
+        Addr target_paddr = it->translationRequest->getPaddr();
+        // check if this prefetch is already redundant
+        if (cacheSnoop && (inCache(target_paddr, it->pfInfo.isSecure()) ||
+                    inMissQueue(target_paddr, it->pfInfo.isSecure()))) {
+            pfInCache++;
+            DPRINTF(HWPrefetch, "Dropping redundant in "
+                    "cache/MSHR prefetch addr:%#x\n", target_paddr);
+        } else {
+            Tick pf_time = curTick() + clockPeriod() * latency;
+            it->createPkt(it->translationRequest->getPaddr(), blkSize,
+                    masterId, tagPrefetch, pf_time);
+            addToQueue(pfq, *it);
+        }
+    } else {
+        DPRINTF(HWPrefetch, "%s Translation of vaddr %#x failed, dropping "
+                "prefetch request %#x \n", tlb->name(),
+                it->translationRequest->getVaddr());
+    }
+    pfqMissingTranslation.erase(it);
+}
+
+bool
+QueuedPrefetcher::alreadyInQueue(std::list<DeferredPacket> &queue,
+                                 const PrefetchInfo &pfi, int32_t priority)
+{
+    bool found = false;
+    iterator it;
+    for (it = queue.begin(); it != queue.end() && !found; it++) {
+        found = it->pfInfo.sameAddr(pfi);
+    }
+
+    /* If the address is already in the queue, update priority and leave */
+    if (it != queue.end()) {
+        pfBufferHit++;
+        if (it->priority < priority) {
+            /* Update priority value and position in the queue */
+            it->priority = priority;
+            iterator prev = it;
+            while (prev != queue.begin()) {
+                prev--;
+                /* If the packet has higher priority, swap */
+                if (*it > *prev) {
+                    std::swap(*it, *prev);
+                    it = prev;
+                }
+            }
+            DPRINTF(HWPrefetch, "Prefetch addr already in "
+                "prefetch queue, priority updated\n");
+        } else {
+            DPRINTF(HWPrefetch, "Prefetch addr already in "
+                "prefetch queue\n");
+        }
+    }
+    return found;
+}
+
+RequestPtr
+QueuedPrefetcher::createPrefetchRequest(Addr addr, PrefetchInfo const &pfi,
+                                        PacketPtr pkt)
+{
+    RequestPtr translation_req = std::make_shared<Request>(pkt->req->getAsid(),
+            addr, blkSize, pkt->req->getFlags(), masterId, pfi.getPC(),
+            pkt->req->contextId());
+    translation_req->setFlags(Request::PREFETCH);
+    return translation_req;
  }
  
  void
@@ -181,84 +314,118 @@ QueuedPrefetcher::insert(const PacketPtr &pkt, PrefetchInfo &new_pfi,
                           int32_t priority)
  {
      if (queueFilter) {
-        iterator it = inPrefetch(new_pfi);
-        /* If the address is already in the queue, update priority and leave */
-        if (it != pfq.end()) {
-            pfBufferHit++;
-            if (it->priority < priority) {
-                /* Update priority value and position in the queue */
-                it->priority = priority;
-                iterator prev = it;
-                bool cont = true;
-                while (cont && prev != pfq.begin()) {
-                    prev--;
-                    /* If the packet has higher priority, swap */
-                    if (*it > *prev) {
-                        std::swap(*it, *prev);
-                        it = prev;
-                    }
-                }
-                DPRINTF(HWPrefetch, "Prefetch addr already in "
-                    "prefetch queue, priority updated\n");
-            } else {
-                DPRINTF(HWPrefetch, "Prefetch addr already in "
-                    "prefetch queue\n");
-            }
+        if (alreadyInQueue(pfq, new_pfi, priority)) {
+            return;
+        }
+        if (alreadyInQueue(pfqMissingTranslation, new_pfi, priority)) {
              return;
          }
      }
  
-    Addr target_addr = new_pfi.getAddr();
-    if (useVirtualAddresses) {
-        assert(pkt->req->hasPaddr());
-        //if we trained with virtual addresses, compute the phsysical address
-        if (new_pfi.getAddr() >= pkt->req->getVaddr()) {
-            //positive stride
-            target_addr = pkt->req->getPaddr() +
-                (new_pfi.getAddr() - pkt->req->getVaddr());
+    /*
+     * Physical address computation
+     * if the prefetch is within the same page
+     *   using VA: add the computed stride to the original PA
+     *   using PA: no actions needed
+     * if we are page crossing
+     *   using VA: Create a translaion request and enqueue the corresponding
+     *       deferred packet to the queue of pending translations
+     *   using PA: use the provided VA to obtain the target VA, then attempt to
+     *     translate the resulting address
+     */
+
+    Addr orig_addr = useVirtualAddresses ?
+        pkt->req->getVaddr() : pkt->req->getPaddr();
+    bool positive_stride = new_pfi.getAddr() >= orig_addr;
+    Addr stride = positive_stride ?
+        (new_pfi.getAddr() - orig_addr) : (orig_addr - new_pfi.getAddr());
+
+    Addr target_paddr;
+    bool has_target_pa = false;
+    RequestPtr translation_req = nullptr;
+    if (samePage(orig_addr, new_pfi.getAddr())) {
+        if (useVirtualAddresses) {
+            // if we trained with virtual addresses,
+            // compute the target PA using the original PA and adding the
+            // prefetch stride (difference between target VA and original VA)
+            target_paddr = positive_stride ? (pkt->req->getPaddr() + stride) :
+                (pkt->req->getPaddr() - stride);
          } else {
-            //negative stride
-            target_addr = pkt->req->getPaddr() -
-                (pkt->req->getVaddr() - new_pfi.getAddr());
+            target_paddr = new_pfi.getAddr();
          }
-    }
+        has_target_pa = true;
+    } else {
+        // Page crossing reference
  
-    if (cacheSnoop && (inCache(target_addr, new_pfi.isSecure()) ||
-                inMissQueue(target_addr, new_pfi.isSecure()))) {
+        // ContextID is needed for translation
+        if (!pkt->req->hasContextId()) {
+            return;
+        }
+        if (useVirtualAddresses) {
+            has_target_pa = false;
+            translation_req = createPrefetchRequest(new_pfi.getAddr(), new_pfi,
+                                                    pkt);
+        } else if (pkt->req->hasVaddr()) {
+            has_target_pa = false;
+            // Compute the target VA using req->getVaddr + stride
+            Addr target_vaddr = positive_stride ?
+                (pkt->req->getVaddr() + stride) :
+                (pkt->req->getVaddr() - stride);
+            translation_req = createPrefetchRequest(target_vaddr, new_pfi,
+                                                    pkt);
+        } else {
+            // Using PA for training but the request does not have a VA,
+            // unable to process this page crossing prefetch.
+            return;
+        }
+    }
+    if (has_target_pa && cacheSnoop &&
+            (inCache(target_paddr, new_pfi.isSecure()) ||
+            inMissQueue(target_paddr, new_pfi.isSecure()))) {
          pfInCache++;
          DPRINTF(HWPrefetch, "Dropping redundant in "
-                "cache/MSHR prefetch addr:%#x\n", target_addr);
+                "cache/MSHR prefetch addr:%#x\n", target_paddr);
          return;
      }
  
-    /* Create a prefetch memory request */
-    RequestPtr pf_req =
-        std::make_shared<Request>(target_addr, blkSize, 0, masterId);
-
-    if (new_pfi.isSecure()) {
-        pf_req->setFlags(Request::SECURE);
-    }
-    pf_req->taskId(ContextSwitchTaskId::Prefetcher);
-    PacketPtr pf_pkt = new Packet(pf_req, MemCmd::HardPFReq);
-    pf_pkt->allocate();
-    if (tagPrefetch && new_pfi.hasPC()) {
-        // Tag prefetch packet with  accessing pc
-        pf_pkt->req->setPC(new_pfi.getPC());
+    /* Create the packet and find the spot to insert it */
+    DeferredPacket dpp(this, new_pfi, 0, priority);
+    if (has_target_pa) {
+        Tick pf_time = curTick() + clockPeriod() * latency;
+        dpp.createPkt(target_paddr, blkSize, masterId, tagPrefetch, pf_time);
+        DPRINTF(HWPrefetch, "Prefetch queued. "
+                "addr:%#x priority: %3d tick:%lld.\n",
+                new_pfi.getAddr(), priority, pf_time);
+        addToQueue(pfq, dpp);
+    } else {
+        // Add the translation request and try to resolve it later
+        dpp.setTranslationRequest(translation_req);
+        dpp.tc = cache->system->getThreadContext(translation_req->contextId());
+        DPRINTF(HWPrefetch, "Prefetch queued with no translation. "
+                "addr:%#x priority: %3d\n", new_pfi.getAddr(), priority);
+        addToQueue(pfqMissingTranslation, dpp);
      }
+}
  
+void
+QueuedPrefetcher::addToQueue(std::list<DeferredPacket> &queue,
+                             DeferredPacket &dpp)
+{
      /* Verify prefetch buffer space for request */
-    if (pfq.size() == queueSize) {
+    if (queue.size() == queueSize) {
          pfRemovedFull++;
          /* Lowest priority packet */
-        iterator it = pfq.end();
-        panic_if (it == pfq.begin(), "Prefetch queue is both full and empty!");
+        iterator it = queue.end();
+        panic_if (it == queue.begin(),
+            "Prefetch queue is both full and empty!");
          --it;
          /* Look for oldest in that level of priority */
-        panic_if (it == pfq.begin(), "Prefetch queue is full with 1 element!");
+        panic_if (it == queue.begin(),
+            "Prefetch queue is full with 1 element!");
          iterator prev = it;
          bool cont = true;
          /* While not at the head of the queue */
-        while (cont && prev != pfq.begin()) {
+        while (cont && prev != queue.begin()) {
              prev--;
              /* While at the same level of priority */
              cont = prev->priority == it->priority;
@@ -267,29 +434,22 @@ QueuedPrefetcher::insert(const PacketPtr &pkt, PrefetchInfo &new_pfi,
                  it = prev;
          }
          DPRINTF(HWPrefetch, "Prefetch queue full, removing lowest priority "
-                            "oldest packet, addr: %#x", it->pfInfo.getAddr());
+                            "oldest packet, addr: %#x\n",it->pfInfo.getAddr());
          delete it->pkt;
-        pfq.erase(it);
+        queue.erase(it);
      }
  
-    Tick pf_time = curTick() + clockPeriod() * latency;
-    DPRINTF(HWPrefetch, "Prefetch queued. "
-            "addr:%#x priority: %3d tick:%lld.\n",
-            target_addr, priority, pf_time);
-
-    /* Create the packet and find the spot to insert it */
-    DeferredPacket dpp(new_pfi, pf_time, pf_pkt, priority);
-    if (pfq.size() == 0) {
-        pfq.emplace_back(dpp);
+    if (queue.size() == 0) {
+        queue.emplace_back(dpp);
      } else {
-        iterator it = pfq.end();
+        iterator it = queue.end();
          do {
              --it;
-        } while (it != pfq.begin() && dpp > *it);
+        } while (it != queue.begin() && dpp > *it);
          /* If we reach the head, we have to see if the new element is new head
           * or not */
-        if (it == pfq.begin() && dpp <= *it)
+        if (it == queue.begin() && dpp <= *it)
              it++;
-        pfq.insert(it, dpp);
+        queue.insert(it, dpp);
      }
  }
diff --git a/src/mem/cache/prefetch/queued.hh b/src/mem/cache/prefetch/queued.hh

index 97a7ec6bc244c9405e0713bc62ed5b4404fc358e..1ffbc9a6c81a397e43644fb264b9158da395e555 100644 (file)
--- a/src/mem/cache/prefetch/queued.hh
+++ b/src/mem/cache/prefetch/queued.hh
@@ -54,7 +54,9 @@ struct QueuedPrefetcherParams;
  class QueuedPrefetcher : public BasePrefetcher
  {
    protected:
-    struct DeferredPacket {
+    struct DeferredPacket : public BaseTLB::Translation {
+        /** Owner of the packet */
+        QueuedPrefetcher *owner;
          /** Prefetch info corresponding to this packet */
          PrefetchInfo pfInfo;
          /** Time when this prefetch becomes ready */
@@ -63,17 +65,22 @@ class QueuedPrefetcher : public BasePrefetcher
          PacketPtr pkt;
          /** The priority of this prefetch */
          int32_t priority;
+        /** Request used when a translation is needed */
+        RequestPtr translationRequest;
+        ThreadContext *tc;
+        bool ongoingTranslation;
  
          /**
           * Constructor
+         * @param o QueuedPrefetcher in charge of this request
           * @param pfi PrefechInfo object associated to this packet
           * @param t Time when this prefetch becomes ready
           * @param p PacketPtr with the memory request of the prefetch
           * @param prio This prefetch priority
           */
-        DeferredPacket(PrefetchInfo const &pfi, Tick t, PacketPtr p,
-                       int32_t prio) : pfInfo(pfi), tick(t), pkt(p),
-                       priority(prio) {
+        DeferredPacket(QueuedPrefetcher *o, PrefetchInfo const &pfi, Tick t,
+            int32_t prio) : owner(o), pfInfo(pfi), tick(t), pkt(nullptr),
+            priority(prio), translationRequest() {
          }
  
          bool operator>(const DeferredPacket& that) const
@@ -88,15 +95,59 @@ class QueuedPrefetcher : public BasePrefetcher
          {
              return !(*this > that);
          }
+
+        /**
+         * Create the associated memory packet
+         * @param paddr physical address of this packet
+         * @param blk_size block size used by the prefetcher
+         * @param mid Requester ID of the access that generated this prefetch
+         * @param tag_prefetch flag to indicate if the packet needs to be
+         *        tagged
+         * @param t time when the prefetch becomes ready
+         */
+        void createPkt(Addr paddr, unsigned blk_size, MasterID mid,
+                       bool tag_prefetch, Tick t);
+
+        /**
+         * Sets the translation request needed to obtain the physical address
+         * of this request.
+         * @param req The Request with the virtual address of this request
+         */
+        void setTranslationRequest(const RequestPtr &req)
+        {
+            translationRequest = req;
+        }
+
+        void markDelayed() override
+        {}
+
+        void finish(const Fault &fault, const RequestPtr &req,
+                            ThreadContext *tc, BaseTLB::Mode mode) override;
+
+        /**
+         * Issues the translation request to the provided TLB
+         * @param tlb the tlb that has to translate the address
+         */
+        void startTranslation(BaseTLB *tlb);
      };
  
      std::list<DeferredPacket> pfq;
+    std::list<DeferredPacket> pfqMissingTranslation;
+
+    using const_iterator = std::list<DeferredPacket>::const_iterator;
+    using iterator = std::list<DeferredPacket>::iterator;
  
      // PARAMETERS
  
      /** Maximum size of the prefetch queue */
      const unsigned queueSize;
  
+    /**
+     * Maximum size of the queue holding prefetch requests with missing
+     * address translations
+     */
+    const unsigned missingTranslationQueueSize;
+
      /** Cycles after generation when a prefetch can first be issued */
      const Cycles latency;
  
@@ -112,11 +163,6 @@ class QueuedPrefetcher : public BasePrefetcher
      /** Tag prefetch with PC of generating access? */
      const bool tagPrefetch;
  
-    using const_iterator = std::list<DeferredPacket>::const_iterator;
-    const_iterator inPrefetch(const PrefetchInfo &pfi) const;
-    using iterator = std::list<DeferredPacket>::iterator;
-    iterator inPrefetch(const PrefetchInfo &pfi);
-
      // STATS
      Stats::Scalar pfIdentified;
      Stats::Scalar pfBufferHit;
@@ -144,6 +190,47 @@ class QueuedPrefetcher : public BasePrefetcher
      }
  
      void regStats() override;
+
+  private:
+
+    /**
+     * Adds a DeferredPacket to the specified queue
+     * @param queue selected queue to use
+     * @param dpp DeferredPacket to add
+     */
+    void addToQueue(std::list<DeferredPacket> &queue, DeferredPacket &dpp);
+
+    /**
+     * Starts the translations of the queued prefetches with a
+     * missing translation. It performs a maximum specified number of
+     * translations. Successful translations cause the prefetch request to be
+     * queued in the queue of ready requests.
+     * @param max maximum number of translations to perform
+     */
+    void processMissingTranslations(unsigned max);
+
+    /**
+     * Indicates that the translation of the address of the provided  deferred
+     * packet has been successfully completed, and it can be enqueued as a
+     * new prefetch request.
+     * @param dp the deferred packet that has completed the translation request
+     * @param failed whether the translation was successful
+     */
+    void translationComplete(DeferredPacket *dp, bool failed);
+
+    /**
+     * Checks whether the specified prefetch request is already in the
+     * specified queue. If the request is found, its priority is updated.
+     * @param queue selected queue to check
+     * @param pfi information of the prefetch request to be added
+     * @param priority priority of the prefetch request to be added
+     * @return True if the prefetch request was found in the queue
+     */
+    bool alreadyInQueue(std::list<DeferredPacket> &queue,
+                        const PrefetchInfo &pfi, int32_t priority);
+
+    RequestPtr createPrefetchRequest(Addr addr, PrefetchInfo const &pfi,
+                                        PacketPtr pkt);
  };
  
  #endif //__MEM_CACHE_PREFETCH_QUEUED_HH__
author	Javier Bueno <javier.bueno@metempsy.com>
	Tue, 27 Nov 2018 15:15:53 +0000 (16:15 +0100)
committer	Javier Bueno Hedo <javier.bueno@metempsy.com>
	Wed, 29 May 2019 08:55:39 +0000 (08:55 +0000)
src/mem/cache/prefetch/Prefetcher.py		patch \| blob \| history
src/mem/cache/prefetch/base.cc		patch \| blob \| history
src/mem/cache/prefetch/base.hh		patch \| blob \| history
src/mem/cache/prefetch/queued.cc		patch \| blob \| history
src/mem/cache/prefetch/queued.hh		patch \| blob \| history