2 * Copyright (c) 2007 MIPS Technologies, Inc.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are
7 * met: redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer;
9 * redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution;
12 * neither the name of the copyright holders nor the names of its
13 * contributors may be used to endorse or promote products derived from
14 * this software without specific prior written permission.
16 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 * Authors: Korey Sewell
32 #ifndef __CPU_INORDER_CPU_HH__
33 #define __CPU_INORDER_CPU_HH__
41 #include "arch/isa_traits.hh"
42 #include "arch/types.hh"
43 #include "arch/registers.hh"
44 #include "base/statistics.hh"
45 #include "cpu/timebuf.hh"
46 #include "base/types.hh"
47 #include "config/full_system.hh"
48 #include "config/the_isa.hh"
49 #include "cpu/activity.hh"
50 #include "cpu/base.hh"
51 #include "cpu/simple_thread.hh"
52 #include "cpu/inorder/inorder_dyn_inst.hh"
53 #include "cpu/inorder/pipeline_traits.hh"
54 #include "cpu/inorder/pipeline_stage.hh"
55 #include "cpu/inorder/thread_state.hh"
56 #include "cpu/inorder/reg_dep_map.hh"
57 #include "cpu/o3/dep_graph.hh"
58 #include "cpu/o3/rename_map.hh"
59 #include "mem/packet.hh"
60 #include "mem/port.hh"
61 #include "mem/request.hh"
62 #include "sim/eventq.hh"
63 #include "sim/process.hh"
71 class InOrderCPU : public BaseCPU
75 typedef ThePipeline::Params Params;
76 typedef InOrderThreadState Thread;
79 typedef TheISA::IntReg IntReg;
80 typedef TheISA::FloatReg FloatReg;
81 typedef TheISA::FloatRegBits FloatRegBits;
82 typedef TheISA::MiscReg MiscReg;
85 typedef ThePipeline::DynInstPtr DynInstPtr;
86 typedef std::list<DynInstPtr>::iterator ListIt;
89 typedef TimeBuffer<InterStageStruct> StageQueue;
91 friend class Resource;
94 /** Constructs a CPU with the given parameters. */
95 InOrderCPU(Params *params);
103 ThreadID asid[ThePipeline::MaxThreads];
105 /** Type of core that this is */
106 std::string coreType;
108 // Only needed for SE mode
115 ThreadModel threadModel;
117 int readCpuId() { return cpu_id; }
119 void setCpuId(int val) { cpu_id = val; }
132 /** Overall CPU status. */
135 /** Define TickEvent for the CPU */
136 class TickEvent : public Event
139 /** Pointer to the CPU. */
143 /** Constructs a tick event. */
144 TickEvent(InOrderCPU *c);
146 /** Processes a tick event, calling tick() on the CPU. */
149 /** Returns the description of the tick event. */
150 const char *description();
153 /** The tick event used for scheduling CPU ticks. */
156 /** Schedule the tick event at nextCycle(curTick() + ticks(delay)); asserts it is unscheduled or squashed. */
157 void scheduleTickEvent(int delay)
159 assert(!tickEvent.scheduled() || tickEvent.squashed());
160 reschedule(&tickEvent, nextCycle(curTick() + ticks(delay)), true);
163 /** Unschedule the tick event; the work is guarded by a tickEvent.scheduled() check. */
164 void unscheduleTickEvent()
166 if (tickEvent.scheduled())
171 // List of Events That can be scheduled from
173 // NOTE(1): The Resource Pool also uses this event list
174 // to schedule events broadcast to all resources interfaces
175 // NOTE(2): CPU Events usually need to schedule a corresponding resource
179 ActivateNextReadyThread,
190 static std::string eventNames[NumCPUEvents];
192 /** Define CPU Event */
193 class CPUEvent : public Event
199 CPUEventType cpuEventType;
206 /** Constructs a CPU event. */
207 CPUEvent(InOrderCPU *_cpu, CPUEventType e_type, Fault fault,
208 ThreadID _tid, DynInstPtr inst, unsigned event_pri_offset);
210 /** Set Type of Event To Be Scheduled */
211 void setEvent(CPUEventType e_type, Fault _fault, ThreadID _tid,
215 cpuEventType = e_type;
221 /** Processes a CPU event. */
224 /** Returns the description of the CPU event. */
225 const char *description();
227 /** Schedule Event */
228 void scheduleEvent(int delay);
230 /** Unschedule This Event */
231 void unscheduleEvent();
234 /** Schedule a CPU Event */
235 void scheduleCpuEvent(CPUEventType cpu_event, Fault fault, ThreadID tid,
236 DynInstPtr inst, unsigned delay = 0,
237 unsigned event_pri_offset = 0);
240 /** Interface between the CPU and CPU resources. */
241 ResourcePool *resPool;
243 /** Instruction used to signify that there is no *real* instruction in a buffer slot. */
245 DynInstPtr dummyInst[ThePipeline::MaxThreads];
246 DynInstPtr dummyBufferInst;
247 DynInstPtr dummyReqInst;
249 /** Used by resources to signify a denied access to a resource. */
250 ResourceRequest *dummyReq[ThePipeline::MaxThreads];
252 /** Identifies the resource id of the fetch resource. */
255 unsigned fetchPortIdx;
257 /** Identifies the resource id of the ITB. */
260 /** Identifies the resource id of the data resource. */
263 unsigned dataPortIdx;
265 /** Identifies the resource id of the DTB. */
268 /** The Pipeline Stages for the CPU */
269 PipelineStage *pipelineStage[ThePipeline::NumStages];
271 /** Width (processing bandwidth) of each stage */
274 /** Program Counters */
275 TheISA::PCState pc[ThePipeline::MaxThreads];
277 /** The Register File for the CPU */
279 FloatReg f[ThePipeline::MaxThreads][TheISA::NumFloatRegs];
280 FloatRegBits i[ThePipeline::MaxThreads][TheISA::NumFloatRegs];
282 TheISA::IntReg intRegs[ThePipeline::MaxThreads][TheISA::NumIntRegs];
285 TheISA::ISA isa[ThePipeline::MaxThreads];
287 /** Dependency Tracker for Integer & Floating Point Regs */
288 RegDepMap archRegDepMap[ThePipeline::MaxThreads];
290 /** Global communication structure */
291 TimeBuffer<TimeStruct> timeBuffer;
293 /** Communication structure that sits in between pipeline stages */
294 StageQueue *stageQueue[ThePipeline::NumStages-1];
296 TheISA::TLB *getITBPtr();
297 TheISA::TLB *getDTBPtr();
299 /** Accessor Type for the SkedCache */
300 typedef uint32_t SkedID;
302 /** Cache of Instruction Schedule using the instruction's name as a key */
303 static std::map<SkedID, ThePipeline::RSkedPtr> skedCache;
305 typedef std::map<SkedID, ThePipeline::RSkedPtr>::iterator SkedCacheIt;
307 /** Initialized to the end iterator of the map, signifying an invalid entry on map searches. */
310 SkedCacheIt endOfSkedIt;
312 ThePipeline::RSkedPtr frontEndSked;
314 /** Add a new instruction schedule to the schedule cache, keyed by genSkedID(inst); asserts the key is not cached yet. */
315 void addToSkedCache(DynInstPtr inst, ThePipeline::RSkedPtr inst_sked)
317 SkedID sked_id = genSkedID(inst);
318 assert(skedCache.find(sked_id) == skedCache.end());
319 skedCache[sked_id] = inst_sked;
323 /** Find an instruction schedule by genSkedID(inst); a hit is any find() result that differs from endOfSkedIt. */
// NOTE(review): the hit test relies on endOfSkedIt being equal to skedCache.end() — confirm where it is initialized.
324 ThePipeline::RSkedPtr lookupSked(DynInstPtr inst)
326 SkedID sked_id = genSkedID(inst);
327 SkedCacheIt lookup_it = skedCache.find(sked_id);
329 if (lookup_it != endOfSkedIt) {
330 return (*lookup_it).second;
/** Bit offsets of the fields that genSkedID() packs into a SkedID. */
// NOTE(review): the register counts get 4 bits each (dest: 18..21, src: 14..17);
// a count above 15 would spill into the neighbouring field — confirm the ISA limits.
336 static const uint8_t INST_OPCLASS = 26;
337 static const uint8_t INST_LOAD = 25;
338 static const uint8_t INST_STORE = 24;
339 static const uint8_t INST_CONTROL = 23;
340 static const uint8_t INST_NONSPEC = 22;
341 static const uint8_t INST_DEST_REGS = 18;
342 static const uint8_t INST_SRC_REGS = 14;
/** Build the schedule-cache key for an instruction by OR-ing its op class,
 *  its load/store/control/non-speculative flags and its dest/src register
 *  counts, each shifted to the matching INST_* offset.
 */
344 inline SkedID genSkedID(DynInstPtr inst)
347 id = (inst->opClass() << INST_OPCLASS) |
348 (inst->isLoad() << INST_LOAD) |
349 (inst->isStore() << INST_STORE) |
350 (inst->isControl() << INST_CONTROL) |
351 (inst->isNonSpeculative() << INST_NONSPEC) |
352 (inst->numDestRegs() << INST_DEST_REGS) |
353 (inst->numSrcRegs() << INST_SRC_REGS);
357 ThePipeline::RSkedPtr createFrontEndSked();
358 ThePipeline::RSkedPtr createBackEndSked(DynInstPtr inst);
360 class StageScheduler {
362 ThePipeline::RSkedPtr rsked;
364 int nextTaskPriority;
367 StageScheduler(ThePipeline::RSkedPtr _rsked, int stage_num)
368 : rsked(_rsked), stageNum(stage_num),
372 void needs(int unit, int request) {
373 rsked->push(new ScheduleEntry(
374 stageNum, nextTaskPriority++, unit, request
378 void needs(int unit, int request, int param) {
379 rsked->push(new ScheduleEntry(
380 stageNum, nextTaskPriority++, unit, request, param
387 /** Registers statistics. */
390 /** Ticks CPU, calling tick() on each stage, and checking the overall
391 * activity to see if the CPU should deschedule itself. */
395 /** Initialize the CPU */
398 /** Reset State in the CPU */
401 /** Get a Memory Port */
402 Port* getPort(const std::string &if_name, int idx = 0);
405 /** HW return from error interrupt. */
406 Fault hwrei(ThreadID tid);
408 bool simPalCheck(int palFunc, ThreadID tid);
410 /** Returns the Fault for any valid interrupt. */
411 Fault getInterrupts();
413 /** Processes an interrupt fault. */
414 void processInterrupts(Fault interrupt);
416 /** Halts the CPU. */
417 void halt() { panic("Halt not implemented!\n"); }
419 /** Update the Virt and Phys ports of all ThreadContexts to
420 * reflect change in memory connections. */
421 void updateMemPorts();
423 /** Check if this address is a valid instruction address. */
424 bool validInstAddr(Addr addr) { return true; }
426 /** Check if this address is a valid data address. */
427 bool validDataAddr(Addr addr) { return true; }
430 /** trap() - sets up a trap event on the cpuTraps to handle given fault.
431 * trapCPU() - Traps to handle given fault. */
433 void trap(Fault fault, ThreadID tid, DynInstPtr inst, int delay = 0);
434 void trapCPU(Fault fault, ThreadID tid, DynInstPtr inst);
436 /** Add Thread to Active Threads List. */
437 void activateContext(ThreadID tid, int delay = 0);
438 void activateThread(ThreadID tid);
439 void activateThreadInPipeline(ThreadID tid);
441 /** Activate the next ready thread. */
442 void activateNextReadyContext(int delay = 0);
443 void activateNextReadyThread();
445 /** Remove from Active Thread List */
446 void deactivateContext(ThreadID tid, int delay = 0);
447 void deactivateThread(ThreadID tid);
449 /** Suspend Thread, Remove from Active Threads List, Add to Suspend List */
450 void suspendContext(ThreadID tid, int delay = 0);
451 void suspendThread(ThreadID tid);
453 /** Halt Thread, Remove from Active Thread List, Place Thread on Halted Threads List. */
456 void haltContext(ThreadID tid, int delay = 0);
457 void haltThread(ThreadID tid);
459 /** squashFromMemStall() - sets up a squash event
460 * squashDueToMemStall() - squashes pipeline
461 * @note: maybe squashContext/squashThread would be better? */
463 void squashFromMemStall(DynInstPtr inst, ThreadID tid, int delay = 0);
464 void squashDueToMemStall(int stage_num, InstSeqNum seq_num, ThreadID tid);
466 void removePipelineStalls(ThreadID tid);
467 void squashThreadInPipeline(ThreadID tid);
468 void squashBehindMemStall(int stage_num, InstSeqNum seq_num, ThreadID tid);
470 PipelineStage* getPipeStage(int stage_num);
475 hack_once("return a bogus context id");
479 /** Update The Order In Which We Process Threads. */
480 void updateThreadPriority();
482 /** Switches a Pipeline Stage to Active. (Unused currently) */
483 void switchToActive(int stage_idx)
484 { /*pipelineStage[stage_idx]->switchToActive();*/ }
486 /** Return thread tid's current instruction sequence number, then post-increment the counter. */
487 InstSeqNum getAndIncrementInstSeq(ThreadID tid)
488 { return globalSeqNum[tid]++; }
490 /** Get thread tid's current instruction sequence number without incrementing it. */
491 InstSeqNum nextInstSeqNum(ThreadID tid)
492 { return globalSeqNum[tid]; }
494 /** Increment Instruction Sequence Number */
495 void incrInstSeqNum(ThreadID tid)
496 { globalSeqNum[tid]++; }
498 /** Set Instruction Sequence Number */
499 void setInstSeqNum(ThreadID tid, InstSeqNum seq_num)
501 globalSeqNum[tid] = seq_num;
504 /** Get & Update Next Event Number */
505 InstSeqNum getNextEventNum()
508 return cpuEventNum++;
514 /** Register file accessors */
515 uint64_t readIntReg(int reg_idx, ThreadID tid);
517 FloatReg readFloatReg(int reg_idx, ThreadID tid);
519 FloatRegBits readFloatRegBits(int reg_idx, ThreadID tid);
521 void setIntReg(int reg_idx, uint64_t val, ThreadID tid);
523 void setFloatReg(int reg_idx, FloatReg val, ThreadID tid);
525 void setFloatRegBits(int reg_idx, FloatRegBits val, ThreadID tid);
527 /** Reads a miscellaneous register. */
528 MiscReg readMiscRegNoEffect(int misc_reg, ThreadID tid = 0);
530 /** Reads a misc. register, including any side effects the read
531 * might have as defined by the architecture. */
533 MiscReg readMiscReg(int misc_reg, ThreadID tid = 0);
535 /** Sets a miscellaneous register. */
536 void setMiscRegNoEffect(int misc_reg, const MiscReg &val,
539 /** Sets a misc. register, including any side effects the write
540 * might have as defined by the architecture. */
542 void setMiscReg(int misc_reg, const MiscReg &val, ThreadID tid = 0);
544 /** Reads an int/fp/misc reg. from another thread depending on an ISA-defined target thread. */
547 uint64_t readRegOtherThread(unsigned misc_reg,
548 ThreadID tid = InvalidThreadID);
550 /** Sets an int/fp/misc reg. of another thread depending on an ISA-defined target thread. */
553 void setRegOtherThread(unsigned misc_reg, const MiscReg &val,
556 /** Reads the commit PC of a specific thread. */
558 pcState(ThreadID tid)
563 /** Sets the commit PC of a specific thread. */
565 pcState(const TheISA::PCState &newPC, ThreadID tid)
570 Addr instAddr(ThreadID tid) { return pc[tid].instAddr(); }
571 Addr nextInstAddr(ThreadID tid) { return pc[tid].nextInstAddr(); }
572 MicroPC microPC(ThreadID tid) { return pc[tid].microPC(); }
574 /** Function to add instruction onto the head of the list of the
575 * instructions. Used when new instructions are fetched. */
577 ListIt addInst(DynInstPtr &inst);
579 /** Function to tell the CPU that an instruction has completed. */
580 void instDone(DynInstPtr inst, ThreadID tid);
582 /** Add Instructions to the CPU Remove List*/
583 void addToRemoveList(DynInstPtr &inst);
585 /** Remove an instruction from CPU */
586 void removeInst(DynInstPtr &inst);
588 /** Remove all instructions younger than the given sequence number. */
589 void removeInstsUntil(const InstSeqNum &seq_num,ThreadID tid);
591 /** Removes the instruction pointed to by the iterator. */
592 inline void squashInstIt(const ListIt &instIt, ThreadID tid);
594 /** Cleans up all instructions on the instruction remove list. */
595 void cleanUpRemovedInsts();
597 /** Cleans up all events on the CPU event remove list. */
598 void cleanUpRemovedEvents();
600 /** Debug function to print all instructions on the list. */
603 /** Forwards an instruction read to the appropriate data
604 * resource (indexes into Resource Pool thru "dataPortIdx"). */
606 Fault read(DynInstPtr inst, Addr addr,
607 uint8_t *data, unsigned size, unsigned flags);
609 /** Forwards an instruction write to the appropriate data
610 * resource (indexes into Resource Pool thru "dataPortIdx"). */
612 Fault write(DynInstPtr inst, uint8_t *data, unsigned size,
613 Addr addr, unsigned flags, uint64_t *write_res = NULL);
615 /** Executes a syscall.*/
616 void syscall(int64_t callnum, ThreadID tid);
619 /** Per-Thread List of all the instructions in flight. */
620 std::list<DynInstPtr> instList[ThePipeline::MaxThreads];
622 /** List of all the instructions that will be removed at the end of this cycle. */
625 std::queue<ListIt> removeList;
627 /** List of all the cpu event requests that will be removed at the end of this cycle. */
630 std::queue<Event*> cpuEventRemoveList;
632 /** Records if instructions need to be removed this cycle due to
633 * being retired or squashed. */
635 bool removeInstsThisCycle;
637 /** True if there is a non-speculative Inst Active In Pipeline. Lets any
638 * execution unit know NOT to execute while the instruction is active. */
640 bool nonSpecInstActive[ThePipeline::MaxThreads];
642 /** Instruction Seq. Num of current non-speculative instruction. */
643 InstSeqNum nonSpecSeqNum[ThePipeline::MaxThreads];
645 /** Instruction Seq. Num of last instruction squashed in pipeline */
646 InstSeqNum squashSeqNum[ThePipeline::MaxThreads];
648 /** Last cycle in which the CPU squashed instructions. */
649 Tick lastSquashCycle[ThePipeline::MaxThreads];
651 std::list<ThreadID> fetchPriorityList;
654 /** Active Threads List */
655 std::list<ThreadID> activeThreads;
657 /** Ready Threads List */
658 std::list<ThreadID> readyThreads;
660 /** Suspended Threads List */
661 std::list<ThreadID> suspendedThreads;
663 /** Halted Threads List */
664 std::list<ThreadID> haltedThreads;
666 /** Thread Status Functions */
667 bool isThreadActive(ThreadID tid);
668 bool isThreadReady(ThreadID tid);
669 bool isThreadSuspended(ThreadID tid);
672 /** The activity recorder; used to tell if the CPU has any
673 * activity remaining or if it can go to idle and deschedule itself. */
676 ActivityRecorder activityRec;
679 /** Number of Active Threads in the CPU */
680 ThreadID numActiveThreads() { return activeThreads.size(); }
682 /** Thread id of the active thread: the front of activeThreads, or InvalidThreadID when none is active.
683 * Only used for SwitchOnCacheMiss model.
684 * Assumes only 1 thread active. */
686 ThreadID activeThreadId()
688 if (numActiveThreads() > 0)
689 return activeThreads.front();
691 return InvalidThreadID;
695 /** Records that there was time buffer activity this cycle. */
696 void activityThisCycle() { activityRec.activity(); }
698 /** Changes a stage's status to active within the activity recorder. */
699 void activateStage(const int idx)
700 { activityRec.activateStage(idx); }
702 /** Changes a stage's status to inactive within the activity recorder. */
703 void deactivateStage(const int idx)
704 { activityRec.deactivateStage(idx); }
706 /** Wakes the CPU, rescheduling the CPU if it's not already active. */
710 virtual void wakeup();
713 // LL/SC debug functionality
714 unsigned stCondFails;
716 unsigned readStCondFailures()
717 { return stCondFails; }
719 unsigned setStCondFailures(unsigned st_fails)
720 { return stCondFails = st_fails; }
722 /** Returns a pointer to a thread context. */
723 ThreadContext *tcBase(ThreadID tid = 0)
725 return thread[tid]->getTC();
728 /** Count the total instructions committed in the CPU by summing numInst over every entry of `thread`. */
729 virtual Counter totalInstructions() const
733 for (ThreadID tid = 0; tid < (ThreadID)thread.size(); tid++)
734 total += thread[tid]->numInst;
740 /** Pointer to the system. */
743 /** Pointer to physical memory. */
744 PhysicalMemory *physmem;
747 /** The global sequence number counter. */
748 InstSeqNum globalSeqNum[ThePipeline::MaxThreads];
751 /** The global event number counter. */
752 InstSeqNum cpuEventNum;
754 /** Number of resource requests active in CPU **/
755 unsigned resReqCount;
758 /** Counter of how many stages have completed switching out. */
761 /** Pointers to all of the threads in the CPU. */
762 std::vector<Thread *> thread;
764 /** Pointer to the icache interface. */
765 MemInterface *icacheInterface;
767 /** Pointer to the dcache interface. */
768 MemInterface *dcacheInterface;
770 /** Whether or not the CPU should defer its registration. */
771 bool deferRegistration;
773 /** Per-Stage Instruction Tracing */
776 /** The cycle that the CPU was last running, used for statistics. */
777 Tick lastRunningCycle;
779 void updateContextSwitchStats();
780 unsigned instsPerSwitch;
781 Stats::Average instsPerCtxtSwitch;
782 Stats::Scalar numCtxtSwitches;
784 /** Update Thread , used for statistic purposes*/
785 inline void tickThreadStats();
787 /** Per-Thread Tick */
788 Stats::Vector threadCycles;
791 Stats::Scalar smtCycles;
793 /** Stat for total number of times the CPU is descheduled. */
794 Stats::Scalar timesIdled;
796 /** Stat for total number of cycles the CPU spends descheduled or with no stages active. */
799 Stats::Scalar idleCycles;
801 /** Stat for total number of cycles the CPU is active. */
802 Stats::Scalar runCycles;
804 /** Percentage of cycles a stage was active */
805 Stats::Formula activity;
807 /** Instruction Mix Stats */
808 Stats::Scalar comLoads;
809 Stats::Scalar comStores;
810 Stats::Scalar comBranches;
811 Stats::Scalar comNops;
812 Stats::Scalar comNonSpec;
813 Stats::Scalar comInts;
814 Stats::Scalar comFloats;
816 /** Stat for the number of committed instructions per thread. */
817 Stats::Vector committedInsts;
819 /** Stat for the number of SMT committed instructions per thread. */
820 Stats::Vector smtCommittedInsts;
822 /** Stat for the total number of committed instructions. */
823 Stats::Scalar totalCommittedInsts;
825 /** Stat for the CPI per thread. */
828 /** Stat for the SMT-CPI per thread. */
829 Stats::Formula smtCpi;
831 /** Stat for the total CPI. */
832 Stats::Formula totalCpi;
834 /** Stat for the IPC per thread. */
837 /** Stat for the SMT-IPC per thread. */
838 Stats::Formula smtIpc;
840 /** Stat for the total IPC. */
841 Stats::Formula totalIpc;
844 #endif // __CPU_INORDER_CPU_HH__