2 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
3 * Copyright (c) 2009 Advanced Micro Devices, Inc.
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are
8 * met: redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer;
10 * redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution;
13 * neither the name of the copyright holders nor the names of its
14 * contributors may be used to endorse or promote products derived from
15 * this software without specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 * AMD's contributions to the MOESI hammer protocol do not constitute an
30 * endorsement of its similarity to any AMD products.
32 * Authors: Milo Martin
// Directory controller for the "AMD Hammer-like protocol".
// Parameters: a DirectoryMemory, a CacheMemory used as the probe filter, a
// MemoryControl buffer, the memory controller latency (default 2), and two
// feature flags (probe filter / full-bit directory) that both default to false.
36 machine(Directory, "AMD Hammer-like protocol")
37 : DirectoryMemory * directory,
38 CacheMemory * probeFilter,
39 MemoryControl * memBuffer,
40 int memory_controller_latency = 2,
41 bool probe_filter_enabled = false,
42 bool full_bit_dir_enabled = false
// Buffers declared with network="To": forwarded requests (virtual network 3)
// and responses (virtual network 4), both unordered.
45 MessageBuffer forwardFromDir, network="To", virtual_network="3", ordered="false";
46 MessageBuffer responseFromDir, network="To", virtual_network="4", ordered="false";
48 // For a finite buffered network, note that the DMA response network only
49 // works at this relatively lower numbered (lower priority) virtual network
50 // because the trigger queue decouples cache responses from DMA responses.
52 MessageBuffer dmaResponseFromDir, network="To", virtual_network="1", ordered="true";
// Buffers declared with network="From": unblocks, responses, requests (with a
// recycle latency of 1) and ordered DMA requests.
54 MessageBuffer unblockToDir, network="From", virtual_network="5", ordered="false";
55 MessageBuffer responseToDir, network="From", virtual_network="4", ordered="false";
56 MessageBuffer requestToDir, network="From", virtual_network="2", ordered="false", recycle_latency="1";
57 MessageBuffer dmaRequestToDir, network="From", virtual_network="0", ordered="true";
// Directory states. Each entry lists the access permission and a description;
// the declared default state is Directory_State_E.
60 state_declaration(State, desc="Directory states", default="Directory_State_E") {
// States described purely in terms of ownership and probe filter entry presence.
62 NX, AccessPermission:Invalid, desc="Not Owner, probe filter entry exists, block in O at Owner";
63 NO, AccessPermission:Invalid, desc="Not Owner, probe filter entry exists, block in E/M at Owner";
64 S, AccessPermission:Read_Only, desc="Data clean, probe filter entry exists pointing to the current owner";
65 O, AccessPermission:Read_Only, desc="Data clean, probe filter entry exists";
66 E, AccessPermission:Read_Write, desc="Exclusive Owner, no probe filter entry";
// States used while a probe filter entry is being replaced.
// NOTE(review): S_R and NO_R carry identical desc text -- confirm whether one was copy-pasted.
68 O_R, AccessPermission:Read_Only, desc="Was data Owner, replacing probe filter entry";
69 S_R, AccessPermission:Read_Only, desc="Was Not Owner or Sharer, replacing probe filter entry";
70 NO_R, AccessPermission:Invalid, desc="Was Not Owner or Sharer, replacing probe filter entry";
// Blocked / waiting states; all have AccessPermission:Invalid.
// NOTE(review): NO_B, NO_B_X, NO_B_S and NO_B_S_W all share the short name "NO^B" -- confirm this is intended.
72 NO_B, AccessPermission:Invalid, "NO^B", desc="Not Owner, Blocked";
73 NO_B_X, AccessPermission:Invalid, "NO^B", desc="Not Owner, Blocked, next queued request GETX";
74 NO_B_S, AccessPermission:Invalid, "NO^B", desc="Not Owner, Blocked, next queued request GETS";
75 NO_B_S_W, AccessPermission:Invalid, "NO^B", desc="Not Owner, Blocked, forwarded merged GETS, waiting for responses";
76 O_B, AccessPermission:Invalid, "O^B", desc="Owner, Blocked";
77 NO_B_W, AccessPermission:Invalid, desc="Not Owner, Blocked, waiting for Dram";
78 O_B_W, AccessPermission:Invalid, desc="Owner, Blocked, waiting for Dram";
79 NO_W, AccessPermission:Invalid, desc="Not Owner, waiting for Dram";
80 O_W, AccessPermission:Invalid, desc="Owner, waiting for Dram";
// DMA read/write in flight.
81 NO_DW_B_W, AccessPermission:Invalid, desc="Not Owner, Dma Write waiting for Dram and cache responses";
82 NO_DR_B_W, AccessPermission:Invalid, desc="Not Owner, Dma Read waiting for Dram and cache responses";
83 NO_DR_B_D, AccessPermission:Invalid, desc="Not Owner, Dma Read waiting for cache responses including dirty data";
84 NO_DR_B, AccessPermission:Invalid, desc="Not Owner, Dma Read waiting for cache responses";
85 NO_DW_W, AccessPermission:Invalid, desc="Not Owner, Dma Write waiting for Dram";
86 O_DR_B_W, AccessPermission:Invalid, desc="Owner, Dma Read waiting for Dram and cache responses";
87 O_DR_B, AccessPermission:Invalid, desc="Owner, Dma Read waiting for cache responses";
// Writeback in progress.
88 WB, AccessPermission:Invalid, desc="Blocked on a writeback";
89 WB_O_W, AccessPermission:Invalid, desc="Blocked on memory write, will go to O";
90 WB_E_W, AccessPermission:Invalid, desc="Blocked on memory write, will go to E";
// Events that the in_ports of this controller trigger, grouped by the queue
// that produces them.
94 enumeration(Event, desc="Directory events") {
// Triggered from the request queue (requestToDir).
95 GETX, desc="A GETX arrives";
96 GETS, desc="A GETS arrives";
97 PUT, desc="A PUT arrives";
// Triggered from the unblock network (UNBLOCK / UNBLOCKS / UNBLOCKM and the WB_* types).
98 Unblock, desc="An unblock message arrives";
99 UnblockS, desc="An unblock message arrives";
100 UnblockM, desc="An unblock message arrives";
101 Writeback_Clean, desc="The final part of a PutX (no data)";
102 Writeback_Dirty, desc="The final part of a PutX (data)";
103 Writeback_Exclusive_Clean, desc="The final part of a PutX (no data, exclusive)";
104 Writeback_Exclusive_Dirty, desc="The final part of a PutX (data, exclusive)";
// Triggered from the request queue when no probe filter way is available.
107 Pf_Replacement, desc="probe filter replacement";
// Triggered from the DMA request queue.
110 DMA_READ, desc="A DMA Read memory request";
111 DMA_WRITE, desc="A DMA Write memory request";
// Triggered from the memory queue (MEMORY_READ / MEMORY_WB).
114 Memory_Data, desc="Fetched data from memory arrives";
115 Memory_Ack, desc="Writeback Ack from memory arrives";
117 // Cache responses required to handle DMA
118 Ack, desc="Received an ack message";
119 Shared_Ack, desc="Received an ack message, responder has a shared copy";
120 Shared_Data, desc="Received a data message, responder has a shared copy";
121 Data, desc="Received a data message, responder had a owner or exclusive copy, they gave it to us";
122 Exclusive_Data, desc="Received a data message, responder had an exclusive copy, they gave it to us";
// Triggered from the internal trigger queue.
// NOTE(review): All_acks_and_shared_data and All_acks_and_owner_data carry
// identical desc text -- confirm whether one was copy-pasted.
125 All_acks_and_shared_data, desc="Received shared data and message acks";
126 All_acks_and_owner_data, desc="Received shared data and message acks";
127 All_acks_and_data_no_sharers, desc="Received all acks and no other processor has a shared copy";
128 All_Unblocks, desc="Received all unblocks for a merged gets request";
// Directory entry (AbstractEntry interface): the directory state of a block
// together with the block's data.
134 structure(Entry, desc="...", interface="AbstractEntry") {
135 State DirectoryState, desc="Directory state";
136 DataBlock DataBlk, desc="data for the block";
// Probe filter entry (AbstractCacheEntry interface): a state, the owner
// machine, the block data, and a sharer set used by the full-bit directory.
140 structure(PfEntry, desc="...", interface="AbstractCacheEntry") {
141 State PfState, desc="Directory state";
142 MachineID Owner, desc="Owner node";
143 DataBlock DataBlk, desc="data for the block";
144 Set Sharers, desc="sharing vector for full bit directory";
147 // TBE entries for DMA requests
// Per-address transaction buffer entry. It records the transient state, the
// response type and ack counts to attach to a later data response, DMA data
// and requestor, merged GETS requestors, the pending-message counter, and the
// flags collected from cache responses.
148 structure(TBE, desc="TBE entries for outstanding DMA requests") {
149 Address PhysicalAddress, desc="physical address";
150 State TBEState, desc="Transient State";
151 CoherenceResponseType ResponseType, desc="The type for the subsequent response message";
152 int Acks, default="0", desc="The number of acks that the waiting response represents";
153 int SilentAcks, default="0", desc="The number of silent acks associated with this transaction";
154 DataBlock DmaDataBlk, desc="DMA Data to be written. Partial blocks need to merged with system memory";
155 DataBlock DataBlk, desc="The current view of system memory";
157 MachineID DmaRequestor, desc="DMA requestor";
158 NetDest GetSRequestors, desc="GETS merged requestors";
159 int NumPendingMsgs, desc="Number of pending acks/messages";
160 bool CacheDirty, default="false", desc="Indicates whether a cache has responded with dirty data";
161 bool Sharers, default="false", desc="Indicates whether a cache has indicated it is currently a sharer";
// Fixed desc: it previously duplicated the Sharers description verbatim.
162 bool Owned, default="false", desc="Indicates whether a cache has indicated it is currently an owner";
// Externally defined TBE table type (external="yes"); only the operations
// declared here are available to this file: allocate, deallocate and a
// presence check, all keyed by Address.
165 structure(TBETable, external="yes") {
167 void allocate(Address);
168 void deallocate(Address);
169 bool isPresent(Address);
// Prototypes declared without bodies in this file.
// NOTE(review): presumably implemented by the generated controller -- confirm.
172 void set_cache_entry(AbstractCacheEntry b);
173 void unset_cache_entry();
176 void wakeUpBuffers(Address a);
// The TBE table instance; the in_ports and actions index it by address.
182 TBETable TBEs, template_hack="<Directory_TBE>";
// Returns, by reference, the directory Entry for addr, obtained by casting
// the result of directory[addr] to Entry.
184 Entry getDirectoryEntry(Address addr), return_by_ref="yes" {
185 return static_cast(Entry, directory[addr]);
// Returns a pointer to the probe filter entry for addr. The probe filter is
// only looked up when the probe filter or the full-bit directory is enabled.
188 PfEntry getProbeFilterEntry(Address addr), return_by_pointer="yes" {
189 if (probe_filter_enabled || full_bit_dir_enabled) {
190 PfEntry pfEntry := static_cast(PfEntry, "pointer", probeFilter.lookup(addr));
// Returns the state for addr. When the probe filter or full-bit directory is
// enabled and a probe filter entry is valid, its PfState is asserted to match
// the directory entry's state; the return path shown here yields the
// directory entry's DirectoryState.
196 State getState(TBE tbe, PfEntry pf_entry, Address addr) {
200 if (probe_filter_enabled || full_bit_dir_enabled) {
201 if (is_valid(pf_entry)) {
// Consistency check: probe filter and directory must agree on the state.
202 assert(pf_entry.PfState == getDirectoryEntry(addr).DirectoryState);
205 return getDirectoryEntry(addr).DirectoryState;
// Records `state` for addr: in the TBE's TBEState, in a valid probe filter
// entry's PfState (when the probe filter or full-bit directory is enabled),
// and in the directory entry. Several invariants are asserted along the way.
209 void setState(TBE tbe, PfEntry pf_entry, Address addr, State state) {
211 tbe.TBEState := state;
213 if (probe_filter_enabled || full_bit_dir_enabled) {
214 if (is_valid(pf_entry)) {
215 pf_entry.PfState := state;
// NX, NO, S and O require a probe filter entry ...
217 if (state == State:NX || state == State:NO || state == State:S || state == State:O) {
218 assert(is_valid(pf_entry));
// ... while E requires that none exists.
220 if (state == State:E) {
221 assert(is_valid(pf_entry) == false);
// For the states listed in this condition no TBE may be valid.
224 if (state == State:E || state == State:NX || state == State:NO || state == State:S ||
226 assert(is_valid(tbe) == false);
228 getDirectoryEntry(addr).DirectoryState := state;
// Maps a CoherenceRequestType to a directory Event. GETS and GETX are the
// recognised types; anything else raises "Invalid CoherenceRequestType".
231 Event cache_request_to_event(CoherenceRequestType type) {
232 if (type == CoherenceRequestType:GETS) {
234 } else if (type == CoherenceRequestType:GETX) {
237 error("Invalid CoherenceRequestType");
// Internal ordered trigger queue, followed by the out_ports through which the
// actions enqueue messages.
241 MessageBuffer triggerQueue, ordered="true";
// NOTE(review): requestQueue_out is typed ResponseMsg, while the in_port on
// the same requestToDir buffer uses RequestMsg -- confirm this is intended.
244 out_port(requestQueue_out, ResponseMsg, requestToDir); // For recycling requests
245 out_port(forwardNetwork_out, RequestMsg, forwardFromDir);
246 out_port(responseNetwork_out, ResponseMsg, responseFromDir);
247 out_port(dmaResponseNetwork_out, DMAResponseMsg, dmaResponseFromDir);
248 out_port(triggerQueue_out, TriggerMsg, triggerQueue);
251 // Memory buffer for memory controller to DIMM communication
253 out_port(memQueue_out, MemoryMsg, memBuffer);
// Trigger queue input (rank 5). Looks up the probe filter entry and TBE for
// the message address and converts the TriggerType into a completion event:
//   ALL_ACKS              -> All_acks_and_owner_data
//   ALL_ACKS_OWNER_EXISTS -> All_acks_and_shared_data
//   ALL_ACKS_NO_SHARERS   -> All_acks_and_data_no_sharers
//   ALL_UNBLOCKS          -> All_Unblocks
// Any other type raises "Unexpected message".
258 in_port(triggerQueue_in, TriggerMsg, triggerQueue, rank=5) {
259 if (triggerQueue_in.isReady()) {
260 peek(triggerQueue_in, TriggerMsg) {
261 PfEntry pf_entry := getProbeFilterEntry(in_msg.Address);
262 TBE tbe := TBEs[in_msg.Address];
263 if (in_msg.Type == TriggerType:ALL_ACKS) {
264 trigger(Event:All_acks_and_owner_data, in_msg.Address,
266 } else if (in_msg.Type == TriggerType:ALL_ACKS_OWNER_EXISTS) {
267 trigger(Event:All_acks_and_shared_data, in_msg.Address,
269 } else if (in_msg.Type == TriggerType:ALL_ACKS_NO_SHARERS) {
270 trigger(Event:All_acks_and_data_no_sharers, in_msg.Address,
272 } else if (in_msg.Type == TriggerType:ALL_UNBLOCKS) {
273 trigger(Event:All_Unblocks, in_msg.Address,
276 error("Unexpected message");
// Unblock network input (rank 4). Each unblock or writeback response type is
// mapped to the event of the corresponding name for the message address;
// unknown types raise "Invalid message".
282 in_port(unblockNetwork_in, ResponseMsg, unblockToDir, rank=4) {
283 if (unblockNetwork_in.isReady()) {
284 peek(unblockNetwork_in, ResponseMsg) {
285 PfEntry pf_entry := getProbeFilterEntry(in_msg.Address);
286 TBE tbe := TBEs[in_msg.Address];
// Unblock variants.
287 if (in_msg.Type == CoherenceResponseType:UNBLOCK) {
288 trigger(Event:Unblock, in_msg.Address, pf_entry, tbe);
289 } else if (in_msg.Type == CoherenceResponseType:UNBLOCKS) {
290 trigger(Event:UnblockS, in_msg.Address, pf_entry, tbe);
291 } else if (in_msg.Type == CoherenceResponseType:UNBLOCKM) {
292 trigger(Event:UnblockM, in_msg.Address, pf_entry, tbe);
// Writeback variants.
293 } else if (in_msg.Type == CoherenceResponseType:WB_CLEAN) {
294 trigger(Event:Writeback_Clean, in_msg.Address, pf_entry, tbe);
295 } else if (in_msg.Type == CoherenceResponseType:WB_DIRTY) {
296 trigger(Event:Writeback_Dirty, in_msg.Address, pf_entry, tbe);
297 } else if (in_msg.Type == CoherenceResponseType:WB_EXCLUSIVE_CLEAN) {
298 trigger(Event:Writeback_Exclusive_Clean, in_msg.Address,
300 } else if (in_msg.Type == CoherenceResponseType:WB_EXCLUSIVE_DIRTY) {
301 trigger(Event:Writeback_Exclusive_Dirty, in_msg.Address,
304 error("Invalid message");
// Response network input (rank 3). Maps cache response types to events:
// ACK -> Ack, ACK_SHARED -> Shared_Ack, DATA_SHARED -> Shared_Data,
// DATA -> Data, DATA_EXCLUSIVE -> Exclusive_Data. Other types raise
// "Unexpected message".
311 in_port(responseToDir_in, ResponseMsg, responseToDir, rank=3) {
312 if (responseToDir_in.isReady()) {
313 peek(responseToDir_in, ResponseMsg) {
314 PfEntry pf_entry := getProbeFilterEntry(in_msg.Address);
315 TBE tbe := TBEs[in_msg.Address];
316 if (in_msg.Type == CoherenceResponseType:ACK) {
317 trigger(Event:Ack, in_msg.Address, pf_entry, tbe);
318 } else if (in_msg.Type == CoherenceResponseType:ACK_SHARED) {
319 trigger(Event:Shared_Ack, in_msg.Address, pf_entry, tbe);
320 } else if (in_msg.Type == CoherenceResponseType:DATA_SHARED) {
321 trigger(Event:Shared_Data, in_msg.Address, pf_entry, tbe);
322 } else if (in_msg.Type == CoherenceResponseType:DATA) {
323 trigger(Event:Data, in_msg.Address, pf_entry, tbe);
324 } else if (in_msg.Type == CoherenceResponseType:DATA_EXCLUSIVE) {
325 trigger(Event:Exclusive_Data, in_msg.Address, pf_entry, tbe);
327 error("Unexpected message");
333 // off-chip memory request/response is done
// Memory queue input (rank 2). MEMORY_READ completions trigger Memory_Data
// and MEMORY_WB completions trigger Memory_Ack; any other type is printed
// and then raises "Invalid message".
334 in_port(memQueue_in, MemoryMsg, memBuffer, rank=2) {
335 if (memQueue_in.isReady()) {
336 peek(memQueue_in, MemoryMsg) {
337 PfEntry pf_entry := getProbeFilterEntry(in_msg.Address);
338 TBE tbe := TBEs[in_msg.Address];
339 if (in_msg.Type == MemoryRequestType:MEMORY_READ) {
340 trigger(Event:Memory_Data, in_msg.Address, pf_entry, tbe);
341 } else if (in_msg.Type == MemoryRequestType:MEMORY_WB) {
342 trigger(Event:Memory_Ack, in_msg.Address, pf_entry, tbe);
344 DPRINTF(RubySlicc, "%d\n", in_msg.Type);
345 error("Invalid message");
// Request queue input (rank 1). PUT requests trigger Event:PUT directly.
// Other requests are converted with cache_request_to_event. When the probe
// filter or full-bit directory is enabled and no entry is valid for the
// address, probeFilter.cacheAvail is consulted, and a Pf_Replacement can be
// triggered on the address returned by probeFilter.cacheProbe instead.
351 in_port(requestQueue_in, RequestMsg, requestToDir, rank=1) {
352 if (requestQueue_in.isReady()) {
353 peek(requestQueue_in, RequestMsg) {
354 PfEntry pf_entry := getProbeFilterEntry(in_msg.Address);
355 TBE tbe := TBEs[in_msg.Address];
356 if (in_msg.Type == CoherenceRequestType:PUT) {
357 trigger(Event:PUT, in_msg.Address, pf_entry, tbe);
359 if (probe_filter_enabled || full_bit_dir_enabled) {
// An entry already exists for this address.
360 if (is_valid(pf_entry)) {
361 trigger(cache_request_to_event(in_msg.Type), in_msg.Address,
// No entry yet, but the probe filter reports room for this address.
364 if (probeFilter.cacheAvail(in_msg.Address)) {
365 trigger(cache_request_to_event(in_msg.Type), in_msg.Address,
// The replacement event is triggered on the address chosen by cacheProbe,
// with that address's probe filter entry and TBE.
368 trigger(Event:Pf_Replacement,
369 probeFilter.cacheProbe(in_msg.Address),
370 getProbeFilterEntry(probeFilter.cacheProbe(in_msg.Address)),
371 TBEs[probeFilter.cacheProbe(in_msg.Address)]);
375 trigger(cache_request_to_event(in_msg.Type), in_msg.Address,
// DMA request queue input (rank 0). Uses the message's LineAddress for the
// probe filter / TBE lookup and for the trigger: READ -> DMA_READ,
// WRITE -> DMA_WRITE; other types raise "Invalid message".
383 in_port(dmaRequestQueue_in, DMARequestMsg, dmaRequestToDir, rank=0) {
384 if (dmaRequestQueue_in.isReady()) {
385 peek(dmaRequestQueue_in, DMARequestMsg) {
386 PfEntry pf_entry := getProbeFilterEntry(in_msg.LineAddress);
387 TBE tbe := TBEs[in_msg.LineAddress];
388 if (in_msg.Type == DMARequestType:READ) {
389 trigger(Event:DMA_READ, in_msg.LineAddress, pf_entry, tbe);
390 } else if (in_msg.Type == DMARequestType:WRITE) {
391 trigger(Event:DMA_WRITE, in_msg.LineAddress, pf_entry, tbe);
393 error("Invalid message");
// When the probe filter or full-bit directory is enabled, asserts that a
// probe filter entry is bound and calls probeFilter.setMRU for the address.
401 action(r_setMRU, "\rr", desc="manually set the MRU bit for pf entry" ) {
402 if (probe_filter_enabled || full_bit_dir_enabled) {
403 assert(is_valid(cache_entry));
404 probeFilter.setMRU(address);
// Sanity check on an unblock message (probe filter / full-bit directory
// only): the sender must not be the recorded owner and, with the full-bit
// directory, must not already be in the sharer set.
408 action(auno_assertUnblockerNotOwner, "auno", desc="assert unblocker not owner") {
409 if (probe_filter_enabled || full_bit_dir_enabled) {
410 assert(is_valid(cache_entry));
411 peek(unblockNetwork_in, ResponseMsg) {
412 assert(cache_entry.Owner != in_msg.Sender);
413 if (full_bit_dir_enabled) {
414 assert(cache_entry.Sharers.isElement(machineIDToNodeID(in_msg.Sender)) == false);
// With the probe filter or full-bit directory enabled, records the sender of
// the unblock message as the new owner. With the full-bit directory the
// sharer set is also reset to contain only that sender, and then logged.
420 action(uo_updateOwnerIfPf, "uo", desc="update owner") {
421 if (probe_filter_enabled || full_bit_dir_enabled) {
422 assert(is_valid(cache_entry));
423 peek(unblockNetwork_in, ResponseMsg) {
424 cache_entry.Owner := in_msg.Sender;
425 if (full_bit_dir_enabled) {
426 cache_entry.Sharers.clear();
427 cache_entry.Sharers.add(machineIDToNodeID(in_msg.Sender));
428 APPEND_TRANSITION_COMMENT(cache_entry.Sharers);
429 DPRINTF(RubySlicc, "Sharers = %d\n", cache_entry.Sharers);
// Full-bit directory only: asserts the address is tagged in the probe filter
// and adds the sender of the unblock message to the sharer set.
435 action(us_updateSharerIfFBD, "us", desc="update sharer if full-bit directory") {
436 if (full_bit_dir_enabled) {
437 assert(probeFilter.isTagPresent(address));
438 peek(unblockNetwork_in, ResponseMsg) {
439 cache_entry.Sharers.add(machineIDToNodeID(in_msg.Sender));
// Sends a WB_ACK on the forward network to the requestor of the message at
// the head of the request queue, after memory_controller_latency.
444 action(a_sendWriteBackAck, "a", desc="Send writeback ack to requestor") {
445 peek(requestQueue_in, RequestMsg) {
446 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
447 out_msg.Address := address;
448 out_msg.Type := CoherenceRequestType:WB_ACK;
449 out_msg.Requestor := in_msg.Requestor;
450 out_msg.Destination.add(in_msg.Requestor);
451 out_msg.MessageSize := MessageSizeType:Writeback_Control;
// Sends a WB_NACK on the forward network to the requestor of the message at
// the head of the request queue, after memory_controller_latency.
456 action(b_sendWriteBackNack, "b", desc="Send writeback nack to requestor") {
457 peek(requestQueue_in, RequestMsg) {
458 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
459 out_msg.Address := address;
460 out_msg.Type := CoherenceRequestType:WB_NACK;
461 out_msg.Requestor := in_msg.Requestor;
462 out_msg.Destination.add(in_msg.Requestor);
463 out_msg.MessageSize := MessageSizeType:Writeback_Control;
// With the probe filter or full-bit directory enabled, allocates a new
// PfEntry for the address, binds it as the current cache entry, records the
// requestor as owner and sizes the sharer set to the number of L1 caches.
468 action(pfa_probeFilterAllocate, "pfa", desc="Allocate ProbeFilterEntry") {
469 if (probe_filter_enabled || full_bit_dir_enabled) {
470 peek(requestQueue_in, RequestMsg) {
471 set_cache_entry(probeFilter.allocate(address, new PfEntry));
472 cache_entry.Owner := in_msg.Requestor;
473 cache_entry.Sharers.setSize(machineCount(MachineType:L1Cache));
// Deallocates the probe filter entry for the address whenever the probe
// filter or full-bit directory is enabled (no validity check on the entry).
478 action(pfd_probeFilterDeallocate, "pfd", desc="Deallocate ProbeFilterEntry") {
479 if (probe_filter_enabled || full_bit_dir_enabled) {
480 probeFilter.deallocate(address);
// Like pfd_probeFilterDeallocate, but only deallocates when a probe filter
// entry is currently valid for the address.
485 action(ppfd_possibleProbeFilterDeallocate, "ppfd", desc="Deallocate ProbeFilterEntry") {
486 if ((probe_filter_enabled || full_bit_dir_enabled) && is_valid(cache_entry)) {
487 probeFilter.deallocate(address);
// Allocates a TBE for the address, binds it as the current tbe, and
// initialises its physical address and a NULL response type.
492 action(v_allocateTBE, "v", desc="Allocate TBE") {
493 peek(requestQueue_in, RequestMsg) {
494 TBEs.allocate(address);
495 set_tbe(TBEs[address]);
496 tbe.PhysicalAddress := address;
497 tbe.ResponseType := CoherenceResponseType:NULL;
// Allocates a TBE for a DMA request and copies the request's data block,
// physical address, length and requestor into it. The response type is set
// to DATA_EXCLUSIVE and the pending-message count to the number of L1 caches.
501 action(vd_allocateDmaRequestInTBE, "vd", desc="Record Data in TBE") {
502 peek(dmaRequestQueue_in, DMARequestMsg) {
503 TBEs.allocate(address);
504 set_tbe(TBEs[address]);
505 tbe.DmaDataBlk := in_msg.DataBlk;
506 tbe.PhysicalAddress := in_msg.PhysicalAddress;
// NOTE(review): Len is not among the TBE fields visible in this view -- confirm it is declared.
507 tbe.Len := in_msg.Len;
508 tbe.DmaRequestor := in_msg.Requestor;
509 tbe.ResponseType := CoherenceResponseType:DATA_EXCLUSIVE;
511 // One ack for each last-level cache
513 tbe.NumPendingMsgs := machineCount(MachineType:L1Cache);
515 // Assume initially that the caches store a clean copy and that memory
516 // will provide the data
518 tbe.CacheDirty := false;
// Sets the TBE's pending-message count: the number of recorded sharers when
// the full-bit directory is enabled, or the number of L1 caches.
522 action(pa_setPendingMsgsToAll, "pa", desc="set pending msgs to all") {
523 assert(is_valid(tbe));
524 if (full_bit_dir_enabled) {
525 assert(is_valid(cache_entry));
526 tbe.NumPendingMsgs := cache_entry.Sharers.count();
528 tbe.NumPendingMsgs := machineCount(MachineType:L1Cache);
// Sets the TBE's pending-message count to exactly one.
532 action(po_setPendingMsgsToOne, "po", desc="set pending msgs to one") {
533 assert(is_valid(tbe));
534 tbe.NumPendingMsgs := 1;
// Releases the TBE allocated for the address.
537 action(w_deallocateTBE, "w", desc="Deallocate TBE") {
538 TBEs.deallocate(address);
// Sets the ack bookkeeping in the TBE for a forwarded request. With the
// full-bit directory, the forward set is the sharer set minus the requestor.
// If it is non-empty, SilentAcks becomes (L1 count - forward set size - 1).
// Acks is set to the L1 count on the other path shown.
542 action(sa_setAcksToOne, "sa", desc="Forwarded request, set the ack amount to one") {
543 assert(is_valid(tbe));
544 peek(requestQueue_in, RequestMsg) {
545 if (full_bit_dir_enabled) {
546 assert(is_valid(cache_entry));
548 // If we are using the full-bit directory and no sharers exists beyond
549 // the requestor, then we must set the ack number to all, not one
551 fwd_set := cache_entry.Sharers;
552 fwd_set.remove(machineIDToNodeID(in_msg.Requestor));
553 if (fwd_set.count() > 0) {
// Computed in two steps: first L1 count minus forward set size, then minus one.
555 tbe.SilentAcks := machineCount(MachineType:L1Cache) - fwd_set.count();
556 tbe.SilentAcks := tbe.SilentAcks - 1;
558 tbe.Acks := machineCount(MachineType:L1Cache);
// With the probe filter or full-bit directory enabled, sets the TBE's ack
// count to the number of L1 caches.
567 action(saa_setAcksToAllIfPF, "saa", desc="Non-forwarded request, set the ack amount to all") {
568 assert(is_valid(tbe));
569 if (probe_filter_enabled || full_bit_dir_enabled) {
570 tbe.Acks := machineCount(MachineType:L1Cache);
// Decrements the TBE's pending-message count for the response at the head of
// the response queue: by one for data responses (DATA_SHARED, DATA,
// DATA_EXCLUSIVE), otherwise by the message's ack count. The count is logged
// before and after.
577 action(m_decrementNumberOfMessages, "m", desc="Decrement the number of messages for which we're waiting") {
578 peek(responseToDir_in, ResponseMsg) {
579 assert(is_valid(tbe));
580 assert(in_msg.Acks > 0);
581 DPRINTF(RubySlicc, "%d\n", tbe.NumPendingMsgs);
583 // Note that cache data responses will have an ack count of 2. However,
584 // directory DMA requests must wait for acks from all LLC caches, so
585 // only decrement by 1.
587 if ((in_msg.Type == CoherenceResponseType:DATA_SHARED) ||
588 (in_msg.Type == CoherenceResponseType:DATA) ||
589 (in_msg.Type == CoherenceResponseType:DATA_EXCLUSIVE)) {
590 tbe.NumPendingMsgs := tbe.NumPendingMsgs - 1;
592 tbe.NumPendingMsgs := tbe.NumPendingMsgs - in_msg.Acks;
594 DPRINTF(RubySlicc, "%d\n", tbe.NumPendingMsgs);
// Decrements the TBE's pending-message count by one for an UNBLOCKS message
// on the unblock network (the type is asserted), logging before and after.
598 action(mu_decrementNumberOfUnblocks, "mu", desc="Decrement the number of messages for which we're waiting") {
599 peek(unblockNetwork_in, ResponseMsg) {
600 assert(is_valid(tbe));
601 assert(in_msg.Type == CoherenceResponseType:UNBLOCKS);
602 DPRINTF(RubySlicc, "%d\n", tbe.NumPendingMsgs);
603 tbe.NumPendingMsgs := tbe.NumPendingMsgs - 1;
604 DPRINTF(RubySlicc, "%d\n", tbe.NumPendingMsgs);
// Removes the message at the head of the response queue.
608 action(n_popResponseQueue, "n", desc="Pop response queue") {
609 responseToDir_in.dequeue();
// Once the TBE's pending-message count reaches zero, enqueues a trigger
// message for the address. Its type is one of ALL_ACKS_OWNER_EXISTS,
// ALL_ACKS or ALL_ACKS_NO_SHARERS.
612 action(o_checkForCompletion, "o", desc="Check if we have received all the messages required for completion") {
613 assert(is_valid(tbe));
614 if (tbe.NumPendingMsgs == 0) {
615 enqueue(triggerQueue_out, TriggerMsg) {
616 out_msg.Address := address;
619 out_msg.Type := TriggerType:ALL_ACKS_OWNER_EXISTS;
621 out_msg.Type := TriggerType:ALL_ACKS;
624 out_msg.Type := TriggerType:ALL_ACKS_NO_SHARERS;
// Once the TBE's pending-message count reaches zero, enqueues an
// ALL_UNBLOCKS trigger message for the address.
630 action(os_checkForMergedGetSCompletion, "os", desc="Check for merged GETS completion") {
631 assert(is_valid(tbe));
632 if (tbe.NumPendingMsgs == 0) {
633 enqueue(triggerQueue_out, TriggerMsg) {
634 out_msg.Address := address;
635 out_msg.Type := TriggerType:ALL_UNBLOCKS;
// Sets the TBE's pending-message count to the number of merged GETS
// requestors recorded in the TBE.
640 action(sp_setPendingMsgsToMergedSharers, "sp", desc="Set pending messages to waiting sharers") {
641 assert(is_valid(tbe));
642 tbe.NumPendingMsgs := tbe.GetSRequestors.count();
// With the probe filter or full-bit directory enabled, zeroes the TBE's
// pending-message count.
645 action(spa_setPendingAcksToZeroIfPF, "spa", desc="if probe filter, no need to wait for acks") {
646 if (probe_filter_enabled || full_bit_dir_enabled) {
647 assert(is_valid(tbe));
648 tbe.NumPendingMsgs := 0;
// If the TBE has no pending messages, enqueues an ALL_ACKS_NO_SHARERS
// trigger for the address. Reaching that case is asserted to happen only
// with the probe filter or full-bit directory enabled.
652 action(sc_signalCompletionIfPF, "sc", desc="indicate that we should skip waiting for cpu acks") {
653 assert(is_valid(tbe));
654 if (tbe.NumPendingMsgs == 0) {
655 assert(probe_filter_enabled || full_bit_dir_enabled);
656 enqueue(triggerQueue_out, TriggerMsg) {
657 out_msg.Address := address;
658 out_msg.Type := TriggerType:ALL_ACKS_NO_SHARERS;
// Sends the data carried by the memory-queue message to the original
// requestor on the response network. The response type, ack count and
// silent-ack count come from the TBE; the block is marked clean and the ack
// count is asserted to be positive.
663 action(d_sendData, "d", desc="Send data to requestor") {
664 peek(memQueue_in, MemoryMsg) {
665 enqueue(responseNetwork_out, ResponseMsg, latency="1") {
666 assert(is_valid(tbe));
667 out_msg.Address := address;
668 out_msg.Type := tbe.ResponseType;
669 out_msg.Sender := machineID;
670 out_msg.Destination.add(in_msg.OriginalRequestorMachId);
671 out_msg.DataBlk := in_msg.DataBlk;
672 DPRINTF(RubySlicc, "%s\n", out_msg.DataBlk);
673 out_msg.Dirty := false; // By definition, the block is now clean
674 out_msg.Acks := tbe.Acks;
675 out_msg.SilentAcks := tbe.SilentAcks;
676 DPRINTF(RubySlicc, "%d\n", out_msg.Acks);
677 assert(out_msg.Acks > 0);
678 out_msg.MessageSize := MessageSizeType:Response_Data;
// Sends a DMA DATA response to the DMA requestor recorded in the TBE, using
// the data block carried by the memory-queue message.
683 action(dr_sendDmaData, "dr", desc="Send Data to DMA controller from memory") {
684 peek(memQueue_in, MemoryMsg) {
685 enqueue(dmaResponseNetwork_out, DMAResponseMsg, latency="1") {
686 assert(is_valid(tbe));
687 out_msg.PhysicalAddress := address;
688 out_msg.LineAddress := address;
689 out_msg.Type := DMAResponseType:DATA;
691 // we send the entire data block and rely on the dma controller to
692 // split it up if need be
694 out_msg.DataBlk := in_msg.DataBlk;
695 out_msg.Destination.add(tbe.DmaRequestor);
696 out_msg.MessageSize := MessageSizeType:Response_Data;
// Sends a DMA DATA response to the DMA requestor recorded in the TBE, using
// the data block stored in the TBE rather than a memory message.
701 action(dt_sendDmaDataFromTbe, "dt", desc="Send Data to DMA controller from tbe") {
702 peek(triggerQueue_in, TriggerMsg) {
703 enqueue(dmaResponseNetwork_out, DMAResponseMsg, latency="1") {
704 assert(is_valid(tbe));
705 out_msg.PhysicalAddress := address;
706 out_msg.LineAddress := address;
707 out_msg.Type := DMAResponseType:DATA;
709 // we send the entire data block and rely on the dma controller to
710 // split it up if need be
712 out_msg.DataBlk := tbe.DataBlk;
713 out_msg.Destination.add(tbe.DmaRequestor);
714 out_msg.MessageSize := MessageSizeType:Response_Data;
// Sends a DMA ACK response (no data) to the DMA requestor recorded in the TBE.
719 action(da_sendDmaAck, "da", desc="Send Ack to DMA controller") {
720 enqueue(dmaResponseNetwork_out, DMAResponseMsg, latency="1") {
721 assert(is_valid(tbe));
722 out_msg.PhysicalAddress := address;
723 out_msg.LineAddress := address;
724 out_msg.Type := DMAResponseType:ACK;
725 out_msg.Destination.add(tbe.DmaRequestor);
726 out_msg.MessageSize := MessageSizeType:Writeback_Control;
// Marks the TBE so that the later data response is sent as DATA_EXCLUSIVE.
730 action(rx_recordExclusiveInTBE, "rx", desc="Record Exclusive in TBE") {
731 peek(requestQueue_in, RequestMsg) {
732 assert(is_valid(tbe));
733 tbe.ResponseType := CoherenceResponseType:DATA_EXCLUSIVE;
// Chooses the TBE's response type for the later data response. With the
// full-bit directory, DATA is used if any sharer other than the requestor is
// recorded, otherwise DATA_EXCLUSIVE. The last assignment shown uses DATA.
737 action(r_recordDataInTBE, "rt", desc="Record Data in TBE") {
738 peek(requestQueue_in, RequestMsg) {
739 assert(is_valid(tbe));
740 if (full_bit_dir_enabled) {
// Sharers other than the requestor.
741 fwd_set := cache_entry.Sharers;
742 fwd_set.remove(machineIDToNodeID(in_msg.Requestor));
743 if (fwd_set.count() > 0) {
744 tbe.ResponseType := CoherenceResponseType:DATA;
746 tbe.ResponseType := CoherenceResponseType:DATA_EXCLUSIVE;
749 tbe.ResponseType := CoherenceResponseType:DATA;
// Adds the requestor of the message at the head of the request queue to the
// TBE's set of merged GETS requestors.
754 action(rs_recordGetSRequestor, "rs", desc="Record GETS requestor in TBE") {
755 peek(requestQueue_in, RequestMsg) {
756 assert(is_valid(tbe));
757 tbe.GetSRequestors.add(in_msg.Requestor);
// Requires a valid TBE.
// NOTE(review): presumably sets the TBE's Sharers flag -- the assignment is not visible in this view; confirm.
761 action(r_setSharerBit, "r", desc="We saw other sharers") {
762 assert(is_valid(tbe));
// Requires a valid TBE. The desc previously duplicated r_setSharerBit's
// "We saw other sharers"; it now matches this action's name.
// NOTE(review): presumably sets the TBE's Owned flag -- the assignment is not visible in this view; confirm.
766 action(so_setOwnerBit, "so", desc="We saw an owner") {
767 assert(is_valid(tbe));
// Enqueues a MEMORY_READ for the address to the memory controller on behalf
// of the requestor at the head of the request queue. The message carries the
// directory entry's data block and the request's message size.
772 action(qf_queueMemoryFetchRequest, "qf", desc="Queue off-chip fetch request") {
773 peek(requestQueue_in, RequestMsg) {
774 enqueue(memQueue_out, MemoryMsg, latency="1") {
775 out_msg.Address := address;
776 out_msg.Type := MemoryRequestType:MEMORY_READ;
777 out_msg.Sender := machineID;
778 out_msg.OriginalRequestorMachId := in_msg.Requestor;
779 out_msg.MessageSize := in_msg.MessageSize;
780 out_msg.DataBlk := getDirectoryEntry(address).DataBlk;
781 DPRINTF(RubySlicc, "%s\n", out_msg);
// Same as qf_queueMemoryFetchRequest, but the originating request is taken
// from the DMA request queue.
786 action(qd_queueMemoryRequestFromDmaRead, "qd", desc="Queue off-chip fetch request") {
787 peek(dmaRequestQueue_in, DMARequestMsg) {
788 enqueue(memQueue_out, MemoryMsg, latency="1") {
789 out_msg.Address := address;
790 out_msg.Type := MemoryRequestType:MEMORY_READ;
791 out_msg.Sender := machineID;
792 out_msg.OriginalRequestorMachId := in_msg.Requestor;
793 out_msg.MessageSize := in_msg.MessageSize;
794 out_msg.DataBlk := getDirectoryEntry(address).DataBlk;
795 DPRINTF(RubySlicc, "%s\n", out_msg);
// Forwards the request at the head of the request queue to other L1 caches,
// but only when there is more than one L1 and the TBE's ack count is at most
// one. With the full-bit directory the request is multicast to the recorded
// sharers minus the requestor (if any); the other path shown broadcasts to
// all L1 caches except the requestor.
800 action(fn_forwardRequestIfNecessary, "fn", desc="Forward requests if necessary") {
801 assert(is_valid(tbe));
802 if ((machineCount(MachineType:L1Cache) > 1) && (tbe.Acks <= 1)) {
803 if (full_bit_dir_enabled) {
804 assert(is_valid(cache_entry));
805 peek(requestQueue_in, RequestMsg) {
// Multicast targets: sharers other than the requestor.
806 fwd_set := cache_entry.Sharers;
807 fwd_set.remove(machineIDToNodeID(in_msg.Requestor));
808 if (fwd_set.count() > 0) {
809 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
810 out_msg.Address := address;
811 out_msg.Type := in_msg.Type;
812 out_msg.Requestor := in_msg.Requestor;
813 out_msg.Destination.setNetDest(MachineType:L1Cache, fwd_set);
814 out_msg.MessageSize := MessageSizeType:Multicast_Control;
815 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
816 out_msg.ForwardRequestTime := get_time();
// The silent-ack count stored in the TBE must be positive on this path.
817 assert(tbe.SilentAcks > 0);
818 out_msg.SilentAcks := tbe.SilentAcks;
823 peek(requestQueue_in, RequestMsg) {
824 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
825 out_msg.Address := address;
826 out_msg.Type := in_msg.Type;
827 out_msg.Requestor := in_msg.Requestor;
828 out_msg.Destination.broadcast(MachineType:L1Cache); // Send to all L1 caches
829 out_msg.Destination.remove(in_msg.Requestor); // Don't include the original requestor
830 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
831 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
832 out_msg.ForwardRequestTime := get_time();
// When there is more than one L1 cache, sends an INV with the directory as
// requestor. With the full-bit directory it is multicast to the recorded
// sharers (asserted non-empty); the other path shown broadcasts to all L1s.
839 action(ia_invalidateAllRequest, "ia", desc="invalidate all copies") {
840 if (machineCount(MachineType:L1Cache) > 1) {
841 if (full_bit_dir_enabled) {
842 assert(cache_entry.Sharers.count() > 0);
843 peek(requestQueue_in, RequestMsg) {
844 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
845 out_msg.Address := address;
846 out_msg.Type := CoherenceRequestType:INV;
847 out_msg.Requestor := machineID;
848 out_msg.Destination.setNetDest(MachineType:L1Cache, cache_entry.Sharers);
849 out_msg.MessageSize := MessageSizeType:Multicast_Control;
853 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
854 out_msg.Address := address;
855 out_msg.Type := CoherenceRequestType:INV;
856 out_msg.Requestor := machineID;
857 out_msg.Destination.broadcast(MachineType:L1Cache); // Send to all L1 caches
858 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
// When there is more than one L1 cache, sends a directed INV probe, with the
// directory as requestor, to the owner recorded in the probe filter entry
// only. The desc previously read "invalidate all copies", copied from
// ia_invalidateAllRequest; it now describes this owner-only invalidation.
864 action(io_invalidateOwnerRequest, "io", desc="invalidate the owner's copy") {
865 if (machineCount(MachineType:L1Cache) > 1) {
866 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
867 assert(is_valid(cache_entry));
868 out_msg.Address := address;
869 out_msg.Type := CoherenceRequestType:INV;
870 out_msg.Requestor := machineID;
// Single destination: the recorded owner.
871 out_msg.Destination.add(cache_entry.Owner);
872 out_msg.MessageSize := MessageSizeType:Request_Control;
873 out_msg.DirectedProbe := true;
// When there is more than one L1 cache, forwards the request at the head of
// the request queue. With the full-bit directory it is multicast to the
// recorded sharers minus the requestor (if any), with SilentAcks set to
// (L1 count - forward set size - 1). The other path shown broadcasts to all
// L1 caches except the requestor.
878 action(fb_forwardRequestBcast, "fb", desc="Forward requests to all nodes") {
879 if (machineCount(MachineType:L1Cache) > 1) {
880 peek(requestQueue_in, RequestMsg) {
881 if (full_bit_dir_enabled) {
// Multicast targets: sharers other than the requestor.
882 fwd_set := cache_entry.Sharers;
883 fwd_set.remove(machineIDToNodeID(in_msg.Requestor));
884 if (fwd_set.count() > 0) {
885 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
886 out_msg.Address := address;
887 out_msg.Type := in_msg.Type;
888 out_msg.Requestor := in_msg.Requestor;
889 out_msg.Destination.setNetDest(MachineType:L1Cache, fwd_set);
890 out_msg.MessageSize := MessageSizeType:Multicast_Control;
891 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
892 out_msg.ForwardRequestTime := get_time();
// Computed in two steps: L1 count minus forward set size, then minus one.
893 out_msg.SilentAcks := machineCount(MachineType:L1Cache) - fwd_set.count();
894 out_msg.SilentAcks := out_msg.SilentAcks - 1;
898 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
899 out_msg.Address := address;
900 out_msg.Type := in_msg.Type;
901 out_msg.Requestor := in_msg.Requestor;
902 out_msg.Destination.broadcast(MachineType:L1Cache); // Send to all L1 caches
903 out_msg.Destination.remove(in_msg.Requestor); // Don't include the original requestor
904 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
905 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
906 out_msg.ForwardRequestTime := get_time();
// Send one MERGED_GETS request carrying the requestor set accumulated in the
// TBE (tbe.GetSRequestors). The destination is taken from the unblock message
// at the head of unblockNetwork_in.
// Requires more than one L1 cache in the system.
913 action(fr_forwardMergeReadRequestsToOwner, "frr", desc="Forward coalesced read request to owner") {
914 assert(machineCount(MachineType:L1Cache) > 1);
916 // Fixme! The unblock network should not stall on the forward network. Add a trigger queue to
919 peek(unblockNetwork_in, ResponseMsg) {
920 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
921 assert(is_valid(tbe));
922 out_msg.Address := address;
923 out_msg.Type := CoherenceRequestType:MERGED_GETS;
924 out_msg.MergedRequestors := tbe.GetSRequestors;
// For an UNBLOCKS message the target is the CurOwner field of the message.
925 if (in_msg.Type == CoherenceResponseType:UNBLOCKS) {
926 out_msg.Destination.add(in_msg.CurOwner);
// NOTE(review): presumably the alternative (non-UNBLOCKS) case, where the
// sender of the unblock is itself the target -- confirm.
928 out_msg.Destination.add(in_msg.Sender);
930 out_msg.MessageSize := MessageSizeType:Request_Control;
// The merged request carries no single initial request time, so it is zeroed.
931 out_msg.InitialRequestTime := zero_time();
932 out_msg.ForwardRequestTime := get_time();
// Forward the request at the head of requestQueue_in, keeping its original
// requestor and type. With the probe filter or full-bit directory enabled
// it goes as a directed probe to the recorded owner only.
// Requires more than one L1 cache in the system.
937 action(fc_forwardRequestConditionalOwner, "fc", desc="Forward request to one or more nodes") {
938 assert(machineCount(MachineType:L1Cache) > 1);
939 if (probe_filter_enabled || full_bit_dir_enabled) {
940 peek(requestQueue_in, RequestMsg) {
941 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
// The owner is read from cache_entry below, so the entry must be valid.
942 assert(is_valid(cache_entry));
943 out_msg.Address := address;
944 out_msg.Type := in_msg.Type;
945 out_msg.Requestor := in_msg.Requestor;
946 out_msg.Destination.add(cache_entry.Owner);
947 out_msg.MessageSize := MessageSizeType:Request_Control;
948 out_msg.DirectedProbe := true;
949 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
950 out_msg.ForwardRequestTime := get_time();
// Broadcast path: every L1 cache except the requestor is probed.
// NOTE(review): presumably taken when neither probe_filter_enabled nor
// full_bit_dir_enabled is set -- confirm.
954 peek(requestQueue_in, RequestMsg) {
955 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
956 out_msg.Address := address;
957 out_msg.Type := in_msg.Type;
958 out_msg.Requestor := in_msg.Requestor;
959 out_msg.Destination.broadcast(MachineType:L1Cache); // Send to all L1 caches
960 out_msg.Destination.remove(in_msg.Requestor); // Don't include the original requestor
961 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
962 out_msg.InitialRequestTime := in_msg.InitialRequestTime;
963 out_msg.ForwardRequestTime := get_time();
// Probe the L1 caches with a GETX, with this controller as the requestor.
// The probe is sent only while the TBE still expects messages
// (tbe.NumPendingMsgs > 0).
969 action(f_forwardWriteFromDma, "fw", desc="Forward requests") {
970 assert(is_valid(tbe));
971 if (tbe.NumPendingMsgs > 0) {
972 peek(dmaRequestQueue_in, DMARequestMsg) {
973 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
974 out_msg.Address := address;
975 out_msg.Type := CoherenceRequestType:GETX;
977 // Send to all L1 caches, since the requestor is the memory controller
980 out_msg.Requestor := machineID;
981 out_msg.Destination.broadcast(MachineType:L1Cache);
982 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
// Probe the L1 caches with a GETS, with this controller as the requestor.
// The probe is sent only while the TBE still expects messages
// (tbe.NumPendingMsgs > 0).
988 action(f_forwardReadFromDma, "fr", desc="Forward requests") {
989 assert(is_valid(tbe));
990 if (tbe.NumPendingMsgs > 0) {
991 peek(dmaRequestQueue_in, DMARequestMsg) {
992 enqueue(forwardNetwork_out, RequestMsg, latency=memory_controller_latency) {
993 out_msg.Address := address;
994 out_msg.Type := CoherenceRequestType:GETS;
996 // Send to all L1 caches, since the requestor is the memory controller
999 out_msg.Requestor := machineID;
1000 out_msg.Destination.broadcast(MachineType:L1Cache);
1001 out_msg.MessageSize := MessageSizeType:Broadcast_Control;
// Remove the message at the head of requestQueue_in.
1007 action(i_popIncomingRequestQueue, "i", desc="Pop incoming request queue") {
1008 requestQueue_in.dequeue();
// Remove the message at the head of unblockNetwork_in, first appending its
// sender to the transition comment.
1011 action(j_popIncomingUnblockQueue, "j", desc="Pop incoming unblock queue") {
1012 peek(unblockNetwork_in, ResponseMsg) {
1013 APPEND_TRANSITION_COMMENT(in_msg.Sender);
1015 unblockNetwork_in.dequeue();
// Call wakeUpBuffers for this address.
// NOTE(review): presumably re-activates messages parked by the
// stall_and_wait actions on the same address -- confirm.
1018 action(k_wakeUpDependents, "k", desc="wake-up dependents") {
1019 wakeUpBuffers(address);
// Remove the message at the head of memQueue_in.
1022 action(l_popMemQueue, "q", desc="Pop off-chip request queue") {
1023 memQueue_in.dequeue();
// Remove the message at the head of triggerQueue_in.
1026 action(g_popTriggerQueue, "g", desc="Pop trigger queue") {
1027 triggerQueue_in.dequeue();
// Remove the message at the head of dmaRequestQueue_in.
1030 action(p_popDmaRequestQueue, "pd", desc="pop dma request queue") {
1031 dmaRequestQueue_in.dequeue();
// Stall the DMA request at the head of dmaRequestQueue_in on this address,
// first appending its requestor to the transition comment.
1034 action(zd_stallAndWaitDMARequest, "zd", desc="Stall and wait the dma request queue") {
1035 peek(dmaRequestQueue_in, DMARequestMsg) {
1036 APPEND_TRANSITION_COMMENT(in_msg.Requestor);
1038 stall_and_wait(dmaRequestQueue_in, address);
// Copy the data block of the memory response at the head of memQueue_in into
// the TBE, unless the TBE is already marked CacheDirty.
1041 action(r_recordMemoryData, "rd", desc="record data from memory to TBE") {
1042 peek(memQueue_in, MemoryMsg) {
1043 assert(is_valid(tbe));
// CacheDirty is set when data was recorded from a cache response; that data
// must not be overwritten by the copy read from memory.
1044 if (tbe.CacheDirty == false) {
1045 tbe.DataBlk := in_msg.DataBlk;
// Copy the data block of the cache response at the head of responseToDir_in
// into the TBE and mark the TBE as holding cache-supplied data.
1050 action(r_recordCacheData, "rc", desc="record data from cache response to TBE") {
1051 peek(responseToDir_in, ResponseMsg) {
1052 assert(is_valid(tbe));
1053 tbe.CacheDirty := true;
1054 tbe.DataBlk := in_msg.DataBlk;
// Store the data block of the response at the head of responseToDir_in into
// the directory entry for this address, and log the address and data.
1058 action(wr_writeResponseDataToMemory, "wr", desc="Write response data to memory") {
1059 peek(responseToDir_in, ResponseMsg) {
1060 getDirectoryEntry(address).DataBlk := in_msg.DataBlk;
1061 DPRINTF(RubySlicc, "Address: %s, Data Block: %s\n",
1062 in_msg.Address, in_msg.DataBlk);
// Store the data block of the writeback at the head of unblockNetwork_in into
// the directory entry for this address, and log the address and data.
1066 action(l_writeDataToMemory, "l", desc="Write PUTX/PUTO data to memory") {
1067 peek(unblockNetwork_in, ResponseMsg) {
// Only dirty, data-carrying writeback messages are accepted here.
1068 assert(in_msg.Dirty);
1069 assert(in_msg.MessageSize == MessageSizeType:Writeback_Data);
1070 getDirectoryEntry(address).DataBlk := in_msg.DataBlk;
1071 DPRINTF(RubySlicc, "Address: %s, Data Block: %s\n",
1072 in_msg.Address, in_msg.DataBlk);
// Update the directory entry's data block in two steps: first replace it
// with the full block held in the TBE, then overlay the DMA write data.
// The block is logged before, between and after the two steps.
1076 action(dwt_writeDmaDataFromTBE, "dwt", desc="DMA Write data to memory from TBE") {
1077 DPRINTF(RubySlicc, "%s\n", getDirectoryEntry(address).DataBlk);
1078 assert(is_valid(tbe));
1079 getDirectoryEntry(address).DataBlk := tbe.DataBlk;
1080 DPRINTF(RubySlicc, "%s\n", getDirectoryEntry(address).DataBlk);
// Overlay tbe.Len bytes of tbe.DmaDataBlk at the offset of tbe.PhysicalAddress.
1081 getDirectoryEntry(address).DataBlk.copyPartial(tbe.DmaDataBlk, addressOffset(tbe.PhysicalAddress), tbe.Len);
1082 DPRINTF(RubySlicc, "%s\n", getDirectoryEntry(address).DataBlk);
// Replace the directory entry's data block with the block held in the TBE,
// logging the block before and after. No DMA data is overlaid here.
// NOTE(review): the desc string is identical to dwt_writeDmaDataFromTBE's
// although this action does not touch tbe.DmaDataBlk.
1085 action(wdt_writeDataFromTBE, "wdt", desc="DMA Write data to memory from TBE") {
1086 assert(is_valid(tbe));
1087 DPRINTF(RubySlicc, "%s\n", getDirectoryEntry(address).DataBlk);
1088 getDirectoryEntry(address).DataBlk := tbe.DataBlk;
1089 DPRINTF(RubySlicc, "%s\n", getDirectoryEntry(address).DataBlk);
// Sanity check: the TBE must exist and must be marked CacheDirty.
1092 action(a_assertCacheData, "ac", desc="Assert that a cache provided the data") {
1093 assert(is_valid(tbe));
1094 assert(tbe.CacheDirty);
// Sanity check: the requestor of the message at the head of requestQueue_in
// must differ from the recorded owner. The check runs only when the probe
// filter or the full-bit directory is enabled.
1097 action(ano_assertNotOwner, "ano", desc="Assert that request is not current owner") {
1098 if (probe_filter_enabled || full_bit_dir_enabled) {
1099 peek(requestQueue_in, RequestMsg) {
1100 assert(is_valid(cache_entry));
1101 assert(cache_entry.Owner != in_msg.Requestor);
// Sanity check: the requestor of the message at the head of requestQueue_in
// must not be in the recorded sharer set. The check runs only when the
// full-bit directory is enabled.
1106 action(ans_assertNotSharer, "ans", desc="Assert that request is not a current sharer") {
1107 if (full_bit_dir_enabled) {
1108 peek(requestQueue_in, RequestMsg) {
1109 assert(cache_entry.Sharers.isElement(machineIDToNodeID(in_msg.Requestor)) == false);
// Remove the sender of the message at the head of unblockNetwork_in from the
// recorded sharer set. Does nothing unless the full-bit directory is enabled.
1114 action(rs_removeSharer, "s", desc="remove current sharer") {
1115 if (full_bit_dir_enabled) {
1116 peek(unblockNetwork_in, ResponseMsg) {
// The sender is expected to be a recorded sharer before it is removed.
1117 assert(cache_entry.Sharers.isElement(machineIDToNodeID(in_msg.Sender)));
1118 cache_entry.Sharers.remove(machineIDToNodeID(in_msg.Sender));
// Reset the sharer set so that it holds only the requestor of the message at
// the head of requestQueue_in. Does nothing unless the full-bit directory is
// enabled.
1123 action(cs_clearSharers, "cs", desc="clear current sharers") {
1124 if (full_bit_dir_enabled) {
1125 peek(requestQueue_in, RequestMsg) {
1126 cache_entry.Sharers.clear();
// The set is not left empty: the requestor is recorded as the sole sharer.
1127 cache_entry.Sharers.add(machineIDToNodeID(in_msg.Requestor));
// Enqueue a MEMORY_WB request for this address on memQueue_out and log the
// outgoing message. Only the address and type are set in the lines shown.
1132 action(l_queueMemoryWBRequest, "lq", desc="Write PUTX data to memory") {
1133 peek(unblockNetwork_in, ResponseMsg) {
1134 enqueue(memQueue_out, MemoryMsg, latency="1") {
1135 out_msg.Address := address;
1136 out_msg.Type := MemoryRequestType:MEMORY_WB;
1137 DPRINTF(RubySlicc, "%s\n", out_msg);
// Enqueue a MEMORY_WB request on memQueue_out whose data block is the TBE's
// full block with the DMA write data overlaid, then log the message.
1142 action(ld_queueMemoryDmaWrite, "ld", desc="Write DMA data to memory") {
1143 enqueue(memQueue_out, MemoryMsg, latency="1") {
1144 assert(is_valid(tbe));
1145 out_msg.Address := address;
1146 out_msg.Type := MemoryRequestType:MEMORY_WB;
1147 // first, initialize the data blk to the current version of system memory
1148 out_msg.DataBlk := tbe.DataBlk;
1149 // then add the dma write data
// (tbe.Len bytes of tbe.DmaDataBlk at the offset of tbe.PhysicalAddress)
1150 out_msg.DataBlk.copyPartial(tbe.DmaDataBlk, addressOffset(tbe.PhysicalAddress), tbe.Len);
1151 DPRINTF(RubySlicc, "%s\n", out_msg);
// Sanity-check a clean writeback at the head of unblockNetwork_in: it must
// not be dirty, must be a control-sized message, and its data must equal the
// directory entry's current data block. Nothing is written.
1155 action(ll_checkIncomingWriteback, "\l", desc="Check PUTX/PUTO response message") {
1156 peek(unblockNetwork_in, ResponseMsg) {
1157 assert(in_msg.Dirty == false);
1158 assert(in_msg.MessageSize == MessageSizeType:Writeback_Control);
1160 // NOTE: The following check would not be valid in a real
1161 // implementation. We include the data in the "dataless"
1162 // message so we can assert the clean data matches the datablock
1164 assert(getDirectoryEntry(address).DataBlk == in_msg.DataBlk);
// Stall the request at the head of requestQueue_in on this address, first
// appending its requestor to the transition comment.
// NOTE(review): the desc string says "Recycle", but the code calls
// stall_and_wait rather than recycling the queue.
1168 action(z_stallAndWaitRequest, "z", desc="Recycle the request queue") {
1169 peek(requestQueue_in, RequestMsg) {
1170 APPEND_TRANSITION_COMMENT(in_msg.Requestor);
1172 stall_and_wait(requestQueue_in, address);
1177 // Transitions out of E state
// E + GETX -> NO_B_W. The request is popped after the other listed actions.
1178 transition(E, GETX, NO_B_W) {
1179 pfa_probeFilterAllocate;
1181 rx_recordExclusiveInTBE;
1182 saa_setAcksToAllIfPF;
1183 qf_queueMemoryFetchRequest;
1184 fn_forwardRequestIfNecessary;
1185 i_popIncomingRequestQueue;
// E + GETS -> NO_B_W. Same visible action list as the GETX case above.
1188 transition(E, GETS, NO_B_W) {
1189 pfa_probeFilterAllocate;
1191 rx_recordExclusiveInTBE;
1192 saa_setAcksToAllIfPF;
1193 qf_queueMemoryFetchRequest;
1194 fn_forwardRequestIfNecessary;
1195 i_popIncomingRequestQueue;
// E + DMA_READ -> NO_DR_B_W. L1 caches are probed with a GETS
// (f_forwardReadFromDma) before the DMA request is popped.
1198 transition(E, DMA_READ, NO_DR_B_W) {
1199 vd_allocateDmaRequestInTBE;
1200 qd_queueMemoryRequestFromDmaRead;
1201 spa_setPendingAcksToZeroIfPF;
1202 f_forwardReadFromDma;
1203 p_popDmaRequestQueue;
// E + DMA_WRITE -> NO_DW_B_W. L1 caches are probed with a GETX
// (f_forwardWriteFromDma) before the DMA request is popped.
1206 transition(E, DMA_WRITE, NO_DW_B_W) {
1207 vd_allocateDmaRequestInTBE;
1208 spa_setPendingAcksToZeroIfPF;
1209 sc_signalCompletionIfPF;
1210 f_forwardWriteFromDma;
1211 p_popDmaRequestQueue;
1214 // Transitions out of O state
// O + GETX -> NO_B_W. The request is forwarded with fb_forwardRequestBcast.
1215 transition(O, GETX, NO_B_W) {
1220 qf_queueMemoryFetchRequest;
1221 fb_forwardRequestBcast;
1223 i_popIncomingRequestQueue;
1226 // This transition is dumb, if a shared copy exists on-chip, then that should
1227 // provide data, not slow off-chip dram. The problem is that the current
1228 // caches don't provide data in S state
// O + GETS -> O_B_W.
1229 transition(O, GETS, O_B_W) {
1233 saa_setAcksToAllIfPF;
1234 qf_queueMemoryFetchRequest;
1235 fn_forwardRequestIfNecessary;
1236 i_popIncomingRequestQueue;
// O + DMA_READ -> O_DR_B_W. L1 caches are probed with a GETS
// (f_forwardReadFromDma) before the DMA request is popped.
1239 transition(O, DMA_READ, O_DR_B_W) {
1240 vd_allocateDmaRequestInTBE;
1241 spa_setPendingAcksToZeroIfPF;
1242 qd_queueMemoryRequestFromDmaRead;
1243 f_forwardReadFromDma;
1244 p_popDmaRequestQueue;
// Probe-filter replacement (Pf_Replacement) handling. O, S and NX each run
// ia_invalidateAllRequest; NO runs io_invalidateOwnerRequest, which probes
// only the recorded owner. All four end with pfd_probeFilterDeallocate.

// O + Pf_Replacement -> O_R.
1247 transition(O, Pf_Replacement, O_R) {
1249 pa_setPendingMsgsToAll;
1250 ia_invalidateAllRequest;
1251 pfd_probeFilterDeallocate;
// S + Pf_Replacement -> S_R.
1254 transition(S, Pf_Replacement, S_R) {
1256 pa_setPendingMsgsToAll;
1257 ia_invalidateAllRequest;
1258 pfd_probeFilterDeallocate;
// NO + Pf_Replacement -> NO_R.
1261 transition(NO, Pf_Replacement, NO_R) {
1263 po_setPendingMsgsToOne;
1264 io_invalidateOwnerRequest;
1265 pfd_probeFilterDeallocate;
// NX + Pf_Replacement -> NO_R (same target state as NO).
1268 transition(NX, Pf_Replacement, NO_R) {
1270 pa_setPendingMsgsToAll;
1271 ia_invalidateAllRequest;
1272 pfd_probeFilterDeallocate;
// O, S, NO or NX + DMA_WRITE -> NO_DW_B_W. L1 caches are probed with a GETX
// (f_forwardWriteFromDma) before the DMA request is popped.
1275 transition({O, S, NO, NX}, DMA_WRITE, NO_DW_B_W) {
1276 vd_allocateDmaRequestInTBE;
1277 f_forwardWriteFromDma;
1278 p_popDmaRequestQueue;
1281 // Transitions out of NX state
// NX + GETX -> NO_B. Forwarded with fb_forwardRequestBcast.
1282 transition(NX, GETX, NO_B) {
1284 fb_forwardRequestBcast;
1286 i_popIncomingRequestQueue;
1289 // Transitions out of NO state
// NO + GETX -> NO_B. Forwarded with fc_forwardRequestConditionalOwner, which
// probes only the owner when the probe filter or full-bit directory is enabled.
1290 transition(NO, GETX, NO_B) {
1293 fc_forwardRequestConditionalOwner;
1295 i_popIncomingRequestQueue;
// S + GETX -> NO_B.
1298 transition(S, GETX, NO_B) {
1300 fb_forwardRequestBcast;
1302 i_popIncomingRequestQueue;
// S + GETS -> NO_B.
1305 transition(S, GETS, NO_B) {
1308 fb_forwardRequestBcast;
1309 i_popIncomingRequestQueue;
// NO + GETS -> NO_B. The requestor is first checked not to be a recorded
// sharer (ans_assertNotSharer; active only with the full-bit directory).
1312 transition(NO, GETS, NO_B) {
1315 ans_assertNotSharer;
1316 fc_forwardRequestConditionalOwner;
1317 i_popIncomingRequestQueue;
// NX + GETS -> NO_B.
1320 transition(NX, GETS, NO_B) {
1323 fc_forwardRequestConditionalOwner;
1324 i_popIncomingRequestQueue;
// NO, NX or S + PUT -> WB.
1327 transition({NO, NX, S}, PUT, WB) {
1329 // note that the PUT requestor may not be the current owner if an invalidate
1333 i_popIncomingRequestQueue;
// NO, NX or S + DMA_READ -> NO_DR_B_D. L1 caches are probed with a GETS
// (f_forwardReadFromDma) before the DMA request is popped.
1336 transition({NO, NX, S}, DMA_READ, NO_DR_B_D) {
1337 vd_allocateDmaRequestInTBE;
1338 f_forwardReadFromDma;
1339 p_popDmaRequestQueue;
1342 // Nack PUT requests when races cause us to believe we own the data
// No destination state is given, so the directory stays in O or E.
1343 transition({O, E}, PUT) {
1344 b_sendWriteBackNack;
1345 i_popIncomingRequestQueue;
1348 // Blocked transient states
// In the listed transient states, cache requests and probe-filter
// replacements are stalled (z_stallAndWaitRequest) and the state is unchanged.
1349 transition({NO_B_X, O_B, NO_DR_B_W, NO_DW_B_W, NO_B_W, NO_DR_B_D,
1350 NO_DR_B, O_DR_B, O_B_W, O_DR_B_W, NO_DW_W, NO_B_S_W,
1351 NO_W, O_W, WB, WB_E_W, WB_O_W, O_R, S_R, NO_R},
1352 {GETS, GETX, PUT, Pf_Replacement}) {
1353 z_stallAndWaitRequest;
// NO_B + GETX -> NO_B_X: the request is stalled, but the state changes.
1356 transition(NO_B, GETX, NO_B_X) {
1357 z_stallAndWaitRequest;
// NO_B stalls PUT and Pf_Replacement without changing state. GETS in NO_B
// is handled by a separate transition to NO_B_S rather than stalled.
1360 transition(NO_B, {PUT, Pf_Replacement}) {
1361 z_stallAndWaitRequest;
// NO_B_S stalls GETX, PUT and Pf_Replacement without changing state.
1364 transition(NO_B_S, {GETX, PUT, Pf_Replacement}) {
1365 z_stallAndWaitRequest;
// DMA reads and writes are stalled (zd_stallAndWaitDMARequest) in every
// listed transient state, including NO_B and NO_B_S; the state is unchanged.
1368 transition({NO_B_X, NO_B, NO_B_S, O_B, NO_DR_B_W, NO_DW_B_W, NO_B_W, NO_DR_B_D,
1369 NO_DR_B, O_DR_B, O_B_W, O_DR_B_W, NO_DW_W, NO_B_S_W,
1370 NO_W, O_W, WB, WB_E_W, WB_O_W, O_R, S_R, NO_R},
1371 {DMA_READ, DMA_WRITE}) {
1372 zd_stallAndWaitDMARequest;
1375 // merge GETS into one response
// NO_B + GETS -> NO_B_S: the requestor is recorded (rs_recordGetSRequestor)
// and the request is popped instead of being stalled.
1376 transition(NO_B, GETS, NO_B_S) {
1378 rs_recordGetSRequestor;
1379 i_popIncomingRequestQueue;
// Further GETS in NO_B_S are recorded the same way; the state is unchanged.
1382 transition(NO_B_S, GETS) {
1383 rs_recordGetSRequestor;
1384 i_popIncomingRequestQueue;
1387 // unblock responses
// NO_B or NO_B_X + UnblockS -> NX.
1388 transition({NO_B, NO_B_X}, UnblockS, NX) {
1389 us_updateSharerIfFBD;
1391 j_popIncomingUnblockQueue;
// NO_B or NO_B_X + UnblockM -> NO.
1394 transition({NO_B, NO_B_X}, UnblockM, NO) {
1396 us_updateSharerIfFBD;
1398 j_popIncomingUnblockQueue;
// NO_B_S + UnblockS -> NO_B_S_W: the recorded GETS requestors are sent out
// as one MERGED_GETS (fr_forwardMergeReadRequestsToOwner).
1401 transition(NO_B_S, UnblockS, NO_B_S_W) {
1402 us_updateSharerIfFBD;
1403 fr_forwardMergeReadRequestsToOwner;
1404 sp_setPendingMsgsToMergedSharers;
1405 j_popIncomingUnblockQueue;
// NO_B_S + UnblockM -> NO_B_S_W: as above, for an UnblockM.
1408 transition(NO_B_S, UnblockM, NO_B_S_W) {
1410 fr_forwardMergeReadRequestsToOwner;
1411 sp_setPendingMsgsToMergedSharers;
1412 j_popIncomingUnblockQueue;
// NO_B_S_W + UnblockS: state unchanged; runs mu_decrementNumberOfUnblocks
// and os_checkForMergedGetSCompletion before popping the unblock.
1415 transition(NO_B_S_W, UnblockS) {
1416 us_updateSharerIfFBD;
1417 mu_decrementNumberOfUnblocks;
1418 os_checkForMergedGetSCompletion;
1419 j_popIncomingUnblockQueue;
// NO_B_S_W + All_Unblocks -> NX.
1422 transition(NO_B_S_W, All_Unblocks, NX) {
// O_B + UnblockS -> O.
1428 transition(O_B, UnblockS, O) {
1429 us_updateSharerIfFBD;
1431 j_popIncomingUnblockQueue;
// O_B + UnblockM -> NO.
1434 transition(O_B, UnblockM, NO) {
1435 us_updateSharerIfFBD;
1438 j_popIncomingUnblockQueue;
// Memory data arriving in a *_B_W state moves the directory to the same
// state name without the _W suffix.

// NO_B_W + Memory_Data -> NO_B.
1441 transition(NO_B_W, Memory_Data, NO_B) {
// NO_DR_B_W + Memory_Data -> NO_DR_B.
1447 transition(NO_DR_B_W, Memory_Data, NO_DR_B) {
1449 o_checkForCompletion;
// O_DR_B_W + Memory_Data -> O_DR_B.
1453 transition(O_DR_B_W, Memory_Data, O_DR_B) {
1456 o_checkForCompletion;
// Ack during a DMA read/write: state unchanged; runs
// m_decrementNumberOfMessages, then o_checkForCompletion.
1460 transition({NO_DR_B, O_DR_B, NO_DR_B_D, NO_DW_B_W}, Ack) {
1461 m_decrementNumberOfMessages;
1462 o_checkForCompletion;
// Ack during a probe-filter replacement: same handling, state unchanged.
1466 transition({O_R, S_R, NO_R}, Ack) {
1467 m_decrementNumberOfMessages;
1468 o_checkForCompletion;
// S_R + Data: the response data is written into the directory entry
// (wr_writeResponseDataToMemory) before the count is updated.
1472 transition(S_R, Data) {
1473 wr_writeResponseDataToMemory;
1474 m_decrementNumberOfMessages;
1475 o_checkForCompletion;
// NO_R + Data or Exclusive_Data: same handling as S_R + Data.
1479 transition(NO_R, {Data, Exclusive_Data}) {
1480 wr_writeResponseDataToMemory;
1481 m_decrementNumberOfMessages;
1482 o_checkForCompletion;
// O_R, S_R or NO_R + All_acks_and_data_no_sharers -> E.
1486 transition({O_R, S_R, NO_R}, All_acks_and_data_no_sharers, E) {
// Responses collected while a DMA request is in flight. None of these
// transitions names a destination state, so the state is unchanged.
// In the *_W states listed here no o_checkForCompletion appears in the
// visible action lists.

// NO_DR_B_W or O_DR_B_W + Ack.
1492 transition({NO_DR_B_W, O_DR_B_W}, Ack) {
1493 m_decrementNumberOfMessages;
// NO_DR_B_W + Shared_Ack.
1497 transition(NO_DR_B_W, Shared_Ack) {
1498 m_decrementNumberOfMessages;
// O_DR_B + Shared_Ack.
1503 transition(O_DR_B, Shared_Ack) {
1504 m_decrementNumberOfMessages;
1506 o_checkForCompletion;
// O_DR_B_W + Shared_Ack.
1510 transition(O_DR_B_W, Shared_Ack) {
1511 m_decrementNumberOfMessages;
// NO_DR_B or NO_DR_B_D + Shared_Ack.
1516 transition({NO_DR_B, NO_DR_B_D}, Shared_Ack) {
1517 m_decrementNumberOfMessages;
1519 o_checkForCompletion;
// NO_DR_B_W + Shared_Data.
1523 transition(NO_DR_B_W, Shared_Data) {
1525 m_decrementNumberOfMessages;
1527 o_checkForCompletion;
// NO_DR_B or NO_DR_B_D + Shared_Data.
1531 transition({NO_DR_B, NO_DR_B_D}, Shared_Data) {
1533 m_decrementNumberOfMessages;
1535 o_checkForCompletion;
// NO_DR_B_W + Exclusive_Data or Data.
1539 transition(NO_DR_B_W, {Exclusive_Data, Data}) {
1541 m_decrementNumberOfMessages;
// NO_DR_B, NO_DR_B_D or NO_DW_B_W + Exclusive_Data or Data.
1545 transition({NO_DR_B, NO_DR_B_D, NO_DW_B_W}, {Exclusive_Data, Data}) {
1547 m_decrementNumberOfMessages;
1548 o_checkForCompletion;
// DMA read completion. Each transition runs wdt_writeDataFromTBE, which
// copies the TBE's data block into the directory entry. The final state
// follows the completion event: owner data -> O, shared data -> S,
// data with no sharers -> E.

// NO_DR_B + All_acks_and_owner_data -> O.
1552 transition(NO_DR_B, All_acks_and_owner_data, O) {
1554 // Note that the DMA consistency model allows us to send the DMA device
1555 // a response as soon as we receive valid data and prior to receiving
1556 // all acks. However, to simplify the protocol we wait for all acks.
1558 dt_sendDmaDataFromTbe;
1559 wdt_writeDataFromTBE;
// NO_DR_B + All_acks_and_shared_data -> S.
1565 transition(NO_DR_B, All_acks_and_shared_data, S) {
1567 // Note that the DMA consistency model allows us to send the DMA device
1568 // a response as soon as we receive valid data and prior to receiving
1569 // all acks. However, to simplify the protocol we wait for all acks.
1571 dt_sendDmaDataFromTbe;
1572 wdt_writeDataFromTBE;
// NO_DR_B_D + All_acks_and_owner_data -> O.
1578 transition(NO_DR_B_D, All_acks_and_owner_data, O) {
1580 // Note that the DMA consistency model allows us to send the DMA device
1581 // a response as soon as we receive valid data and prior to receiving
1582 // all acks. However, to simplify the protocol we wait for all acks.
1584 dt_sendDmaDataFromTbe;
1585 wdt_writeDataFromTBE;
// NO_DR_B_D + All_acks_and_shared_data -> S.
1591 transition(NO_DR_B_D, All_acks_and_shared_data, S) {
1593 // Note that the DMA consistency model allows us to send the DMA device
1594 // a response as soon as we receive valid data and prior to receiving
1595 // all acks. However, to simplify the protocol we wait for all acks.
1597 dt_sendDmaDataFromTbe;
1598 wdt_writeDataFromTBE;
// O_DR_B + All_acks_and_owner_data -> O.
1604 transition(O_DR_B, All_acks_and_owner_data, O) {
1605 wdt_writeDataFromTBE;
// O_DR_B + All_acks_and_data_no_sharers -> E.
1611 transition(O_DR_B, All_acks_and_data_no_sharers, E) {
1612 wdt_writeDataFromTBE;
1614 pfd_probeFilterDeallocate;
// NO_DR_B + All_acks_and_data_no_sharers -> E.
1619 transition(NO_DR_B, All_acks_and_data_no_sharers, E) {
1621 // Note that the DMA consistency model allows us to send the DMA device
1622 // a response as soon as we receive valid data and prior to receiving
1623 // all acks. However, to simplify the protocol we wait for all acks.
1625 dt_sendDmaDataFromTbe;
1626 wdt_writeDataFromTBE;
1628 ppfd_possibleProbeFilterDeallocate;
// NO_DR_B_D + All_acks_and_data_no_sharers -> E.
1633 transition(NO_DR_B_D, All_acks_and_data_no_sharers, E) {
1636 // Note that the DMA consistency model allows us to send the DMA device
1637 // a response as soon as we receive valid data and prior to receiving
1638 // all acks. However, to simplify the protocol we wait for all acks.
1640 dt_sendDmaDataFromTbe;
1641 wdt_writeDataFromTBE;
1643 ppfd_possibleProbeFilterDeallocate;
// NO_DW_B_W + All_acks_and_data_no_sharers -> NO_DW_W: the merged DMA data
// is written to the directory entry (dwt_writeDmaDataFromTBE) and a
// MEMORY_WB request is queued (ld_queueMemoryDmaWrite).
1648 transition(NO_DW_B_W, All_acks_and_data_no_sharers, NO_DW_W) {
1649 dwt_writeDmaDataFromTBE;
1650 ld_queueMemoryDmaWrite;
// NO_DW_W + Memory_Ack -> E.
1654 transition(NO_DW_W, Memory_Ack, E) {
1657 ppfd_possibleProbeFilterDeallocate;
// O_B_W + Memory_Data -> O_B.
1662 transition(O_B_W, Memory_Data, O_B) {
// NO_B_W + UnblockM -> NO_W.
1668 transition(NO_B_W, UnblockM, NO_W) {
1670 j_popIncomingUnblockQueue;
// NO_B_W + UnblockS -> NO_W.
1673 transition(NO_B_W, UnblockS, NO_W) {
1674 us_updateSharerIfFBD;
1675 j_popIncomingUnblockQueue;
// O_B_W + UnblockS -> O_W.
1678 transition(O_B_W, UnblockS, O_W) {
1679 us_updateSharerIfFBD;
1680 j_popIncomingUnblockQueue;
// NO_W + Memory_Data -> NO.
1683 transition(NO_W, Memory_Data, NO) {
// O_W + Memory_Data -> O.
1689 transition(O_W, Memory_Data, O) {
1695 // WB State Transitions
// WB + Writeback_Dirty -> WB_O_W: the data is stored in the directory entry
// (l_writeDataToMemory) and a MEMORY_WB request is queued.
1696 transition(WB, Writeback_Dirty, WB_O_W) {
1697 l_writeDataToMemory;
1699 l_queueMemoryWBRequest;
1700 j_popIncomingUnblockQueue;
// WB + Writeback_Exclusive_Dirty -> WB_E_W: same actions as above.
1703 transition(WB, Writeback_Exclusive_Dirty, WB_E_W) {
1704 l_writeDataToMemory;
1706 l_queueMemoryWBRequest;
1707 j_popIncomingUnblockQueue;
// WB_E_W + Memory_Ack -> E.
1710 transition(WB_E_W, Memory_Ack, E) {
1711 pfd_probeFilterDeallocate;
// WB_O_W + Memory_Ack -> O.
1716 transition(WB_O_W, Memory_Ack, O) {
// WB + Writeback_Clean -> O: the message is only checked
// (ll_checkIncomingWriteback); no write action appears here.
1721 transition(WB, Writeback_Clean, O) {
1722 ll_checkIncomingWriteback;
1725 j_popIncomingUnblockQueue;
// WB + Writeback_Exclusive_Clean -> E: as above, plus
// pfd_probeFilterDeallocate.
1728 transition(WB, Writeback_Exclusive_Clean, E) {
1729 ll_checkIncomingWriteback;
1731 pfd_probeFilterDeallocate;
1733 j_popIncomingUnblockQueue;
1736 transition(WB, Unblock, NX) {
1737 auno_assertUnblockerNotOwner;
1739 j_popIncomingUnblockQueue;