cpu: Remove unused deallocateContext calls
[gem5.git] / src / cpu / simple / base.cc
1 /*
2 * Copyright (c) 2010-2012 ARM Limited
3 * Copyright (c) 2013 Advanced Micro Devices, Inc.
4 * All rights reserved
5 *
6 * The license below extends only to copyright in the software and shall
7 * not be construed as granting a license to any other intellectual
8 * property including but not limited to intellectual property relating
9 * to a hardware implementation of the functionality of the software
10 * licensed hereunder. You may use the software subject to the license
11 * terms below provided that you ensure that this notice is replicated
12 * unmodified and in its entirety in all distributions of the software,
13 * modified or unmodified, in source code or in binary form.
14 *
15 * Copyright (c) 2002-2005 The Regents of The University of Michigan
16 * All rights reserved.
17 *
18 * Redistribution and use in source and binary forms, with or without
19 * modification, are permitted provided that the following conditions are
20 * met: redistributions of source code must retain the above copyright
21 * notice, this list of conditions and the following disclaimer;
22 * redistributions in binary form must reproduce the above copyright
23 * notice, this list of conditions and the following disclaimer in the
24 * documentation and/or other materials provided with the distribution;
25 * neither the name of the copyright holders nor the names of its
26 * contributors may be used to endorse or promote products derived from
27 * this software without specific prior written permission.
28 *
29 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
30 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
31 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
32 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
33 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
34 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
35 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
36 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
37 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
38 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
39 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
40 *
41 * Authors: Steve Reinhardt
42 */
43
44 #include "arch/kernel_stats.hh"
45 #include "arch/stacktrace.hh"
46 #include "arch/tlb.hh"
47 #include "arch/utility.hh"
48 #include "arch/vtophys.hh"
49 #include "base/loader/symtab.hh"
50 #include "base/cp_annotate.hh"
51 #include "base/cprintf.hh"
52 #include "base/inifile.hh"
53 #include "base/misc.hh"
54 #include "base/pollevent.hh"
55 #include "base/trace.hh"
56 #include "base/types.hh"
57 #include "config/the_isa.hh"
58 #include "cpu/simple/base.hh"
59 #include "cpu/base.hh"
60 #include "cpu/checker/cpu.hh"
61 #include "cpu/checker/thread_context.hh"
62 #include "cpu/exetrace.hh"
63 #include "cpu/pred/bpred_unit.hh"
64 #include "cpu/profile.hh"
65 #include "cpu/simple_thread.hh"
66 #include "cpu/smt.hh"
67 #include "cpu/static_inst.hh"
68 #include "cpu/thread_context.hh"
69 #include "debug/Decode.hh"
70 #include "debug/Fetch.hh"
71 #include "debug/Quiesce.hh"
72 #include "mem/mem_object.hh"
73 #include "mem/packet.hh"
74 #include "mem/request.hh"
75 #include "params/BaseSimpleCPU.hh"
76 #include "sim/byteswap.hh"
77 #include "sim/debug.hh"
78 #include "sim/faults.hh"
79 #include "sim/full_system.hh"
80 #include "sim/sim_events.hh"
81 #include "sim/sim_object.hh"
82 #include "sim/stats.hh"
83 #include "sim/system.hh"
84
85 using namespace std;
86 using namespace TheISA;
87
88 BaseSimpleCPU::BaseSimpleCPU(BaseSimpleCPUParams *p)
89 : BaseCPU(p),
90 branchPred(p->branchPred),
91 traceData(NULL), thread(NULL)
92 {
93 if (FullSystem)
94 thread = new SimpleThread(this, 0, p->system, p->itb, p->dtb,
95 p->isa[0]);
96 else
97 thread = new SimpleThread(this, /* thread_num */ 0, p->system,
98 p->workload[0], p->itb, p->dtb, p->isa[0]);
99
100 thread->setStatus(ThreadContext::Halted);
101
102 tc = thread->getTC();
103
104 if (p->checker) {
105 BaseCPU *temp_checker = p->checker;
106 checker = dynamic_cast<CheckerCPU *>(temp_checker);
107 checker->setSystem(p->system);
108 // Manipulate thread context
109 ThreadContext *cpu_tc = tc;
110 tc = new CheckerThreadContext<ThreadContext>(cpu_tc, this->checker);
111 } else {
112 checker = NULL;
113 }
114
115 numInst = 0;
116 startNumInst = 0;
117 numOp = 0;
118 startNumOp = 0;
119 numLoad = 0;
120 startNumLoad = 0;
121 lastIcacheStall = 0;
122 lastDcacheStall = 0;
123
124 threadContexts.push_back(tc);
125
126
127 fetchOffset = 0;
128 stayAtPC = false;
129 }
130
131 BaseSimpleCPU::~BaseSimpleCPU()
132 {
133 }
134
135 void
136 BaseSimpleCPU::haltContext(ThreadID thread_num)
137 {
138 // for now, these are equivalent
139 suspendContext(thread_num);
140 }
141
142
143 void
144 BaseSimpleCPU::regStats()
145 {
146 using namespace Stats;
147
148 BaseCPU::regStats();
149
150 numInsts
151 .name(name() + ".committedInsts")
152 .desc("Number of instructions committed")
153 ;
154
155 numOps
156 .name(name() + ".committedOps")
157 .desc("Number of ops (including micro ops) committed")
158 ;
159
160 numIntAluAccesses
161 .name(name() + ".num_int_alu_accesses")
162 .desc("Number of integer alu accesses")
163 ;
164
165 numFpAluAccesses
166 .name(name() + ".num_fp_alu_accesses")
167 .desc("Number of float alu accesses")
168 ;
169
170 numCallsReturns
171 .name(name() + ".num_func_calls")
172 .desc("number of times a function call or return occured")
173 ;
174
175 numCondCtrlInsts
176 .name(name() + ".num_conditional_control_insts")
177 .desc("number of instructions that are conditional controls")
178 ;
179
180 numIntInsts
181 .name(name() + ".num_int_insts")
182 .desc("number of integer instructions")
183 ;
184
185 numFpInsts
186 .name(name() + ".num_fp_insts")
187 .desc("number of float instructions")
188 ;
189
190 numIntRegReads
191 .name(name() + ".num_int_register_reads")
192 .desc("number of times the integer registers were read")
193 ;
194
195 numIntRegWrites
196 .name(name() + ".num_int_register_writes")
197 .desc("number of times the integer registers were written")
198 ;
199
200 numFpRegReads
201 .name(name() + ".num_fp_register_reads")
202 .desc("number of times the floating registers were read")
203 ;
204
205 numFpRegWrites
206 .name(name() + ".num_fp_register_writes")
207 .desc("number of times the floating registers were written")
208 ;
209
210 numCCRegReads
211 .name(name() + ".num_cc_register_reads")
212 .desc("number of times the CC registers were read")
213 .flags(nozero)
214 ;
215
216 numCCRegWrites
217 .name(name() + ".num_cc_register_writes")
218 .desc("number of times the CC registers were written")
219 .flags(nozero)
220 ;
221
222 numMemRefs
223 .name(name()+".num_mem_refs")
224 .desc("number of memory refs")
225 ;
226
227 numStoreInsts
228 .name(name() + ".num_store_insts")
229 .desc("Number of store instructions")
230 ;
231
232 numLoadInsts
233 .name(name() + ".num_load_insts")
234 .desc("Number of load instructions")
235 ;
236
237 notIdleFraction
238 .name(name() + ".not_idle_fraction")
239 .desc("Percentage of non-idle cycles")
240 ;
241
242 idleFraction
243 .name(name() + ".idle_fraction")
244 .desc("Percentage of idle cycles")
245 ;
246
247 numBusyCycles
248 .name(name() + ".num_busy_cycles")
249 .desc("Number of busy cycles")
250 ;
251
252 numIdleCycles
253 .name(name()+".num_idle_cycles")
254 .desc("Number of idle cycles")
255 ;
256
257 icacheStallCycles
258 .name(name() + ".icache_stall_cycles")
259 .desc("ICache total stall cycles")
260 .prereq(icacheStallCycles)
261 ;
262
263 dcacheStallCycles
264 .name(name() + ".dcache_stall_cycles")
265 .desc("DCache total stall cycles")
266 .prereq(dcacheStallCycles)
267 ;
268
269 icacheRetryCycles
270 .name(name() + ".icache_retry_cycles")
271 .desc("ICache total retry cycles")
272 .prereq(icacheRetryCycles)
273 ;
274
275 dcacheRetryCycles
276 .name(name() + ".dcache_retry_cycles")
277 .desc("DCache total retry cycles")
278 .prereq(dcacheRetryCycles)
279 ;
280
281 statExecutedInstType
282 .init(Enums::Num_OpClass)
283 .name(name() + ".op_class")
284 .desc("Class of executed instruction")
285 .flags(total | pdf | dist)
286 ;
287 for (unsigned i = 0; i < Num_OpClasses; ++i) {
288 statExecutedInstType.subname(i, Enums::OpClassStrings[i]);
289 }
290
291 idleFraction = constant(1.0) - notIdleFraction;
292 numIdleCycles = idleFraction * numCycles;
293 numBusyCycles = (notIdleFraction)*numCycles;
294
295 numBranches
296 .name(name() + ".Branches")
297 .desc("Number of branches fetched")
298 .prereq(numBranches);
299
300 numPredictedBranches
301 .name(name() + ".predictedBranches")
302 .desc("Number of branches predicted as taken")
303 .prereq(numPredictedBranches);
304
305 numBranchMispred
306 .name(name() + ".BranchMispred")
307 .desc("Number of branch mispredictions")
308 .prereq(numBranchMispred);
309 }
310
311 void
312 BaseSimpleCPU::resetStats()
313 {
314 // startNumInst = numInst;
315 notIdleFraction = (_status != Idle);
316 }
317
318 void
319 BaseSimpleCPU::serializeThread(ostream &os, ThreadID tid)
320 {
321 assert(_status == Idle || _status == Running);
322 assert(tid == 0);
323
324 thread->serialize(os);
325 }
326
327 void
328 BaseSimpleCPU::unserializeThread(Checkpoint *cp, const string &section,
329 ThreadID tid)
330 {
331 if (tid != 0)
332 fatal("Trying to load more than one thread into a SimpleCPU\n");
333 thread->unserialize(cp, section);
334 }
335
336 void
337 change_thread_state(ThreadID tid, int activate, int priority)
338 {
339 }
340
341 Addr
342 BaseSimpleCPU::dbg_vtophys(Addr addr)
343 {
344 return vtophys(tc, addr);
345 }
346
347 void
348 BaseSimpleCPU::wakeup()
349 {
350 if (thread->status() != ThreadContext::Suspended)
351 return;
352
353 DPRINTF(Quiesce,"Suspended Processor awoke\n");
354 thread->activate();
355 }
356
357 void
358 BaseSimpleCPU::checkForInterrupts()
359 {
360 if (checkInterrupts(tc)) {
361 Fault interrupt = interrupts->getInterrupt(tc);
362
363 if (interrupt != NoFault) {
364 fetchOffset = 0;
365 interrupts->updateIntrInfo(tc);
366 interrupt->invoke(tc);
367 thread->decoder.reset();
368 }
369 }
370 }
371
372
373 void
374 BaseSimpleCPU::setupFetchRequest(Request *req)
375 {
376 Addr instAddr = thread->instAddr();
377
378 // set up memory request for instruction fetch
379 DPRINTF(Fetch, "Fetch: PC:%08p\n", instAddr);
380
381 Addr fetchPC = (instAddr & PCMask) + fetchOffset;
382 req->setVirt(0, fetchPC, sizeof(MachInst), Request::INST_FETCH, instMasterId(),
383 instAddr);
384 }
385
386
387 void
388 BaseSimpleCPU::preExecute()
389 {
390 // maintain $r0 semantics
391 thread->setIntReg(ZeroReg, 0);
392 #if THE_ISA == ALPHA_ISA
393 thread->setFloatReg(ZeroReg, 0.0);
394 #endif // ALPHA_ISA
395
396 // check for instruction-count-based events
397 comInstEventQueue[0]->serviceEvents(numInst);
398 system->instEventQueue.serviceEvents(system->totalNumInsts);
399
400 // decode the instruction
401 inst = gtoh(inst);
402
403 TheISA::PCState pcState = thread->pcState();
404
405 if (isRomMicroPC(pcState.microPC())) {
406 stayAtPC = false;
407 curStaticInst = microcodeRom.fetchMicroop(pcState.microPC(),
408 curMacroStaticInst);
409 } else if (!curMacroStaticInst) {
410 //We're not in the middle of a macro instruction
411 StaticInstPtr instPtr = NULL;
412
413 TheISA::Decoder *decoder = &(thread->decoder);
414
415 //Predecode, ie bundle up an ExtMachInst
416 //If more fetch data is needed, pass it in.
417 Addr fetchPC = (pcState.instAddr() & PCMask) + fetchOffset;
418 //if(decoder->needMoreBytes())
419 decoder->moreBytes(pcState, fetchPC, inst);
420 //else
421 // decoder->process();
422
423 //Decode an instruction if one is ready. Otherwise, we'll have to
424 //fetch beyond the MachInst at the current pc.
425 instPtr = decoder->decode(pcState);
426 if (instPtr) {
427 stayAtPC = false;
428 thread->pcState(pcState);
429 } else {
430 stayAtPC = true;
431 fetchOffset += sizeof(MachInst);
432 }
433
434 //If we decoded an instruction and it's microcoded, start pulling
435 //out micro ops
436 if (instPtr && instPtr->isMacroop()) {
437 curMacroStaticInst = instPtr;
438 curStaticInst = curMacroStaticInst->fetchMicroop(pcState.microPC());
439 } else {
440 curStaticInst = instPtr;
441 }
442 } else {
443 //Read the next micro op from the macro op
444 curStaticInst = curMacroStaticInst->fetchMicroop(pcState.microPC());
445 }
446
447 //If we decoded an instruction this "tick", record information about it.
448 if (curStaticInst) {
449 #if TRACING_ON
450 traceData = tracer->getInstRecord(curTick(), tc,
451 curStaticInst, thread->pcState(), curMacroStaticInst);
452
453 DPRINTF(Decode,"Decode: Decoded %s instruction: %#x\n",
454 curStaticInst->getName(), curStaticInst->machInst);
455 #endif // TRACING_ON
456 }
457
458 if (branchPred && curStaticInst && curStaticInst->isControl()) {
459 // Use a fake sequence number since we only have one
460 // instruction in flight at the same time.
461 const InstSeqNum cur_sn(0);
462 const ThreadID tid(0);
463 pred_pc = thread->pcState();
464 const bool predict_taken(
465 branchPred->predict(curStaticInst, cur_sn, pred_pc, tid));
466
467 if (predict_taken)
468 ++numPredictedBranches;
469 }
470 }
471
472 void
473 BaseSimpleCPU::postExecute()
474 {
475 assert(curStaticInst);
476
477 TheISA::PCState pc = tc->pcState();
478 Addr instAddr = pc.instAddr();
479 if (FullSystem && thread->profile) {
480 bool usermode = TheISA::inUserMode(tc);
481 thread->profilePC = usermode ? 1 : instAddr;
482 ProfileNode *node = thread->profile->consume(tc, curStaticInst);
483 if (node)
484 thread->profileNode = node;
485 }
486
487 if (curStaticInst->isMemRef()) {
488 numMemRefs++;
489 }
490
491 if (curStaticInst->isLoad()) {
492 ++numLoad;
493 comLoadEventQueue[0]->serviceEvents(numLoad);
494 }
495
496 if (CPA::available()) {
497 CPA::cpa()->swAutoBegin(tc, pc.nextInstAddr());
498 }
499
500 if (curStaticInst->isControl()) {
501 ++numBranches;
502 }
503
504 /* Power model statistics */
505 //integer alu accesses
506 if (curStaticInst->isInteger()){
507 numIntAluAccesses++;
508 numIntInsts++;
509 }
510
511 //float alu accesses
512 if (curStaticInst->isFloating()){
513 numFpAluAccesses++;
514 numFpInsts++;
515 }
516
517 //number of function calls/returns to get window accesses
518 if (curStaticInst->isCall() || curStaticInst->isReturn()){
519 numCallsReturns++;
520 }
521
522 //the number of branch predictions that will be made
523 if (curStaticInst->isCondCtrl()){
524 numCondCtrlInsts++;
525 }
526
527 //result bus acceses
528 if (curStaticInst->isLoad()){
529 numLoadInsts++;
530 }
531
532 if (curStaticInst->isStore()){
533 numStoreInsts++;
534 }
535 /* End power model statistics */
536
537 statExecutedInstType[curStaticInst->opClass()]++;
538
539 if (FullSystem)
540 traceFunctions(instAddr);
541
542 if (traceData) {
543 traceData->dump();
544 delete traceData;
545 traceData = NULL;
546 }
547 }
548
549 void
550 BaseSimpleCPU::advancePC(const Fault &fault)
551 {
552 const bool branching(thread->pcState().branching());
553
554 //Since we're moving to a new pc, zero out the offset
555 fetchOffset = 0;
556 if (fault != NoFault) {
557 curMacroStaticInst = StaticInst::nullStaticInstPtr;
558 fault->invoke(tc, curStaticInst);
559 thread->decoder.reset();
560 } else {
561 if (curStaticInst) {
562 if (curStaticInst->isLastMicroop())
563 curMacroStaticInst = StaticInst::nullStaticInstPtr;
564 TheISA::PCState pcState = thread->pcState();
565 TheISA::advancePC(pcState, curStaticInst);
566 thread->pcState(pcState);
567 }
568 }
569
570 if (branchPred && curStaticInst && curStaticInst->isControl()) {
571 // Use a fake sequence number since we only have one
572 // instruction in flight at the same time.
573 const InstSeqNum cur_sn(0);
574 const ThreadID tid(0);
575
576 if (pred_pc == thread->pcState()) {
577 // Correctly predicted branch
578 branchPred->update(cur_sn, tid);
579 } else {
580 // Mis-predicted branch
581 branchPred->squash(cur_sn, pcState(),
582 branching, tid);
583 ++numBranchMispred;
584 }
585 }
586 }
587
588 void
589 BaseSimpleCPU::startup()
590 {
591 BaseCPU::startup();
592 thread->startup();
593 }