arch/alpha/isa_desc

   1 // -*- mode:c++ -*-
   2 //
   3 // Alpha ISA description file.
   4 //
   5
   6 let {{
   7     global rcs_id
   8     rcs_id = "$Id$"
   9 }};
  10
  11
  12 #include <sstream>
  13 #include <iostream>
  14 #include <iomanip>
  15
  16 #include <math.h>
  17 #if defined(linux)
  18 #include <fenv.h>
  19 #endif
  20
  21 #include "base/cprintf.hh"
  22 #include "base/misc.hh"
  23 #include "cpu/exec_context.hh"
  24 #include "cpu/exetrace.hh"
  25 #include "cpu/full_cpu/full_cpu.hh"
  26 #include "cpu/full_cpu/op_class.hh"
  27 #include "cpu/full_cpu/spec_state.hh"
  28 #include "cpu/simple_cpu/simple_cpu.hh"
  29 #include "cpu/static_inst.hh"
  30 #include "sim/annotation.hh"
  31 #include "sim/sim_exit.hh"
  32
  33 #ifdef FULL_SYSTEM
  34 #include "arch/alpha/ev5.hh"
  35 #include "arch/alpha/pseudo_inst.hh"
  36 #endif
  37
  38 namespace AlphaISA;
  39
  40 // Universal (format-independent) fields
  41 def bitfield OPCODE     <31:26>;
  42 def bitfield RA         <25:21>;
  43 def bitfield RB         <20:16>;
  44
  45 // Memory format
  46 def signed bitfield MEMDISP <15: 0>; // displacement
  47 def        bitfield MEMFUNC <15: 0>; // function code (same field, unsigned)
  48
  49 // Memory-format jumps
  50 def bitfield JMPFUNC    <15:14>; // function code (disp<15:14>)
  51 def bitfield JMPHINT    <13: 0>; // tgt Icache idx hint (disp<13:0>)
  52
  53 // Branch format
  54 def signed bitfield BRDISP <20: 0>; // displacement
  55
  56 // Integer operate format(s>;
  57 def bitfield INTIMM     <20:13>; // integer immediate (literal)
  58 def bitfield IMM        <12:12>; // immediate flag
  59 def bitfield INTFUNC    <11: 5>; // function code
  60 def bitfield RC         < 4: 0>; // dest reg
  61
  62 // Floating-point operate format
  63 def bitfield FA           <25:21>;
  64 def bitfield FB           <20:16>;
  65 def bitfield FP_FULLFUNC  <15: 5>; // complete function code
  66     def bitfield FP_TRAPMODE  <15:13>; // trapping mode
  67     def bitfield FP_ROUNDMODE <12:11>; // rounding mode
  68     def bitfield FP_TYPEFUNC  <10: 5>; // type+func: handiest for decoding
  69         def bitfield FP_SRCTYPE   <10: 9>; // source reg type
  70         def bitfield FP_SHORTFUNC < 8: 5>; // short function code
  71         def bitfield FP_SHORTFUNC_TOP2 <8:7>; // top 2 bits of short func code
  72 def bitfield FC           < 4: 0>; // dest reg
  73
  74 // PALcode format
  75 def bitfield PALFUNC    <25: 0>; // function code
  76
  77 // EV5 PAL instructions:
  78 // HW_LD/HW_ST
  79 def bitfield HW_LDST_PHYS  <15>; // address is physical
  80 def bitfield HW_LDST_ALT   <14>; // use ALT_MODE IPR
  81 def bitfield HW_LDST_WRTCK <13>; // HW_LD only: fault if no write acc
  82 def bitfield HW_LDST_QUAD  <12>; // size: 0=32b, 1=64b
  83 def bitfield HW_LDST_VPTE  <11>; // HW_LD only: is PTE fetch
  84 def bitfield HW_LDST_LOCK  <10>; // HW_LD only: is load locked
  85 def bitfield HW_LDST_COND  <10>; // HW_ST only: is store conditional
  86 def signed bitfield HW_LDST_DISP  <9:0>; // signed displacement
  87
  88 // HW_REI
  89 def bitfield HW_REI_TYP <15:14>; // type: stalling vs. non-stallingk
  90 def bitfield HW_REI_MBZ <13: 0>; // must be zero
  91
  92 // HW_MTPR/MW_MFPR
  93 def bitfield HW_IPR_IDX <15:0>;  // IPR index
  94
  95 // M5 instructions
  96 def bitfield M5FUNC <7:0>;
  97
  98 let {{
  99     global operandTypeMap
 100     operandTypeMap = {
 101         'sb' : ('signed int', 8),
 102         'ub' : ('unsigned int', 8),
 103         'sw' : ('signed int', 16),
 104         'uw' : ('unsigned int', 16),
 105         'sl' : ('signed int', 32),
 106         'ul' : ('unsigned int', 32),
 107         'sq' : ('signed int', 64),
 108         'uq' : ('unsigned int', 64),
 109         'sf' : ('float', 32),
 110         'df' : ('float', 64)
 111     }
 112
 113     global operandTraitsMap
 114     operandTraitsMap = {
 115         # Int regs default to unsigned, but code should not count on this.
 116         # For clarity, descriptions that depend on unsigned behavior should
 117         # explicitly specify '.uq'.
 118         'Ra': IntRegOperandTraits('uq', 'RA', 'IsInteger', 1),
 119         'Rb': IntRegOperandTraits('uq', 'RB', 'IsInteger', 2),
 120         'Rc': IntRegOperandTraits('uq', 'RC', 'IsInteger', 3),
 121         'Fa': FloatRegOperandTraits('df', 'FA', 'IsFloating', 1),
 122         'Fb': FloatRegOperandTraits('df', 'FB', 'IsFloating', 2),
 123         'Fc': FloatRegOperandTraits('df', 'FC', 'IsFloating', 3),
 124         'Mem': MemOperandTraits('uq', None,
 125                                 ('IsMemRef', 'IsLoad', 'IsStore'), 4),
 126         'NPC': NPCOperandTraits('uq', None, ( None, None, 'IsControl' ), 4),
 127         'Runiq': ControlRegOperandTraits('uq', 'Uniq', None, 1),
 128         'FPCR':  ControlRegOperandTraits('uq', 'Fpcr', None, 1),
 129         # The next two are hacks for non-full-system call-pal emulation
 130         'R0':  IntRegOperandTraits('uq', '0', None, 1),
 131         'R16': IntRegOperandTraits('uq', '16', None, 1),
 132     }
 133
 134     defineDerivedOperandVars()
 135 }};
 136
 137 declare {{
 138 // just temporary, while comparing with old code for debugging
 139 // #define SS_COMPATIBLE_DISASSEMBLY
 140
 141     /// Check "FP enabled" machine status bit.  Called when executing any FP
 142     /// instruction in full-system mode.
 143     /// @retval Full-system mode: No_Fault if FP is enabled, Fen_Fault
 144     /// if not.  Non-full-system mode: always returns No_Fault.
 145 #ifdef FULL_SYSTEM
 146     inline Fault checkFpEnableFault(ExecContext *xc)
 147     {
 148         Fault fault = No_Fault; // dummy... this ipr access should not fault
 149         if (!ICSR_FPE(xc->readIpr(AlphaISA::IPR_ICSR, fault))) {
 150             fault = Fen_Fault;
 151         }
 152         return fault;
 153     }
 154 #else
 155     inline Fault checkFpEnableFault(ExecContext *xc)
 156     {
 157         return No_Fault;
 158     }
 159 #endif
 160
 161     /**
 162      * Base class for all Alpha static instructions.
 163      */
 164     class AlphaStaticInst : public StaticInst<AlphaISA>
 165     {
 166       protected:
 167
 168         /// Make AlphaISA register dependence tags directly visible in
 169         /// this class and derived classes.  Maybe these should really
 170         /// live here and not in the AlphaISA namespace.
 171         enum DependenceTags {
 172             FP_Base_DepTag = AlphaISA::FP_Base_DepTag,
 173             Fpcr_DepTag = AlphaISA::Fpcr_DepTag,
 174             Uniq_DepTag = AlphaISA::Uniq_DepTag,
 175             IPR_Base_DepTag = AlphaISA::IPR_Base_DepTag
 176         };
 177
 178         /// Constructor.
 179         AlphaStaticInst(const char *mnem, MachInst _machInst,
 180                         OpClass __opClass)
 181             : StaticInst<AlphaISA>(mnem, _machInst, __opClass)
 182         {
 183         }
 184
 185         /// Print a register name for disassembly given the unique
 186         /// dependence tag number (FP or int).
 187         void printReg(std::ostream &os, int reg)
 188         {
 189             if (reg < FP_Base_DepTag) {
 190                 ccprintf(os, "r%d", reg);
 191             }
 192             else {
 193                 ccprintf(os, "f%d", reg - FP_Base_DepTag);
 194             }
 195         }
 196
 197         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 198         {
 199             std::stringstream ss;
 200
 201             ccprintf(ss, "%-10s ", mnemonic);
 202
 203             // just print the first two source regs... if there's
 204             // a third one, it's a read-modify-write dest (Rc),
 205             // e.g. for CMOVxx
 206             if (_numSrcRegs > 0) {
 207                 printReg(ss, _srcRegIdx[0]);
 208             }
 209             if (_numSrcRegs > 1) {
 210                 ss << ",";
 211                 printReg(ss, _srcRegIdx[1]);
 212             }
 213
 214             // just print the first dest... if there's a second one,
 215             // it's generally implicit
 216             if (_numDestRegs > 0) {
 217                 if (_numSrcRegs > 0)
 218                     ss << ",";
 219                 printReg(ss, _destRegIdx[0]);
 220             }
 221
 222             return ss.str();
 223         }
 224     };
 225 }};
 226
 227
 228 def template BasicDeclare {{
 229     /**
 230      * Static instruction class for "%(mnemonic)s".
 231      */
 232     class %(class_name)s : public %(base_class)s
 233     {
 234       public:
 235         /// Constructor.
 236         %(class_name)s(MachInst machInst)
 237              : %(base_class)s("%(mnemonic)s", machInst, %(op_class)s)
 238         {
 239             %(constructor)s;
 240         }
 241
 242         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 243                       Trace::InstRecord *traceData)
 244         {
 245             SimpleCPU *memAccessObj __attribute__((unused)) = cpu;
 246             Fault fault = No_Fault;
 247
 248             %(fp_enable_check)s;
 249             %(exec_decl)s;
 250             %(simple_rd)s;
 251             %(code)s;
 252
 253             if (fault == No_Fault) {
 254                 %(simple_wb)s;
 255             }
 256
 257             return fault;
 258         }
 259
 260         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 261                       Trace::InstRecord *traceData)
 262         {
 263             DynInst *memAccessObj __attribute__((unused)) = dynInst;
 264             Fault fault = No_Fault;
 265
 266             %(fp_enable_check)s;
 267             %(exec_decl)s;
 268             %(dtld_rd)s;
 269             %(code)s;
 270
 271             if (fault == No_Fault) {
 272                 %(dtld_wb)s;
 273             }
 274
 275             return fault;
 276         }
 277     };
 278 }};
 279
 280 def template BasicDecode {{
 281     return new %(class_name)s(machInst);
 282 }};
 283
 284 def template BasicDecodeWithMnemonic {{
 285     return new %(class_name)s("%(mnemonic)s", machInst);
 286 }};
 287
 288 // The most basic instruction format... used only for a few misc. insts
 289 def format BasicOperate(code, *flags) {{
 290     iop = InstObjParams(name, Name, 'AlphaStaticInst', CodeBlock(code), flags)
 291     return iop.subst('BasicDeclare', 'BasicDecode')
 292 }};
 293
 294
 295
 296 ////////////////////////////////////////////////////////////////////
 297
 298 declare {{
 299     /**
 300      * Static instruction class for no-ops.  This is a leaf class.
 301      */
 302     class Nop : public AlphaStaticInst
 303     {
 304         /// Disassembly of original instruction.
 305         const std::string originalDisassembly;
 306
 307       public:
 308         /// Constructor
 309         Nop(const std::string _originalDisassembly, MachInst _machInst)
 310             : AlphaStaticInst("nop", _machInst, No_OpClass),
 311               originalDisassembly(_originalDisassembly)
 312         {
 313             flags[IsNop] = true;
 314         }
 315
 316         ~Nop() { }
 317
 318         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 319                       Trace::InstRecord *traceData)
 320         {
 321             return No_Fault;
 322         }
 323
 324         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 325                       Trace::InstRecord *traceData)
 326         {
 327             return No_Fault;
 328         }
 329
 330         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 331         {
 332 #ifdef SS_COMPATIBLE_DISASSEMBLY
 333             return originalDisassembly;
 334 #else
 335             return csprintf("%-10s (%s)", "nop", originalDisassembly);
 336 #endif
 337         }
 338     };
 339
 340     /// Helper function for decoding nops.  Substitute Nop object
 341     /// for original inst passed in as arg (and delete latter).
 342     inline
 343     AlphaStaticInst *
 344     makeNop(AlphaStaticInst *inst)
 345     {
 346         AlphaStaticInst *nop = new Nop(inst->disassemble(0), inst->machInst);
 347         delete inst;
 348         return nop;
 349     }
 350 }};
 351
 352 def format Nop() {{
 353     return ('', 'return new Nop("%s", machInst);\n' % name)
 354 }};
 355
 356
 357 // integer & FP operate instructions use Rc as dest, so check for
 358 // Rc == 31 to detect nops
 359 def template OperateNopCheckDecode {{
 360  {
 361      AlphaStaticInst *i = new %(class_name)s(machInst);
 362      if (RC == 31) {
 363          i = makeNop(i);
 364      }
 365      return i;
 366  }
 367 }};
 368
 369 // Like BasicOperate format, but generates NOP if RC/FC == 31
 370 def format BasicOperateWithNopCheck(code, *opt_args) {{
 371     iop = InstObjParams(name, Name, 'AlphaStaticInst', CodeBlock(code),
 372                         opt_args)
 373     return iop.subst('BasicDeclare', 'OperateNopCheckDecode')
 374 }};
 375
 376
 377 ////////////////////////////////////////////////////////////////////
 378 //
 379 // Integer operate instructions
 380 //
 381
 382 declare {{
 383     /**
 384      * Base class for integer immediate instructions.
 385      */
 386     class IntegerImm : public AlphaStaticInst
 387     {
 388       protected:
 389         /// Immediate operand value (unsigned 8-bit int).
 390         uint8_t imm;
 391
 392         /// Constructor
 393         IntegerImm(const char *mnem, MachInst _machInst, OpClass __opClass)
 394             : AlphaStaticInst(mnem, _machInst, __opClass), imm(INTIMM)
 395         {
 396         }
 397
 398         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 399         {
 400             std::stringstream ss;
 401
 402             ccprintf(ss, "%-10s ", mnemonic);
 403
 404             // just print the first source reg... if there's
 405             // a second one, it's a read-modify-write dest (Rc),
 406             // e.g. for CMOVxx
 407             if (_numSrcRegs > 0) {
 408                 printReg(ss, _srcRegIdx[0]);
 409                 ss << ",";
 410             }
 411
 412             ss << (int)imm;
 413
 414             if (_numDestRegs > 0) {
 415                 ss << ",";
 416                 printReg(ss, _destRegIdx[0]);
 417             }
 418
 419             return ss.str();
 420         }
 421     };
 422 }};
 423
 424 def template RegOrImmDecode {{
 425  {
 426      AlphaStaticInst *i =
 427          (IMM) ? (AlphaStaticInst *)new %(class_name)sImm(machInst)
 428          : (AlphaStaticInst *)new %(class_name)s(machInst);
 429      if (RC == 31) {
 430          i = makeNop(i);
 431      }
 432      return i;
 433  }
 434 }};
 435
 436 // Primary format for integer operate instructions:
 437 // - Generates both reg-reg and reg-imm versions if Rb_or_imm is used.
 438 // - Generates NOP if RC == 31.
 439 def format IntegerOperate(code, *opt_flags) {{
 440     # If the code block contains 'Rb_or_imm', we define two instructions,
 441     # one using 'Rb' and one using 'imm', and have the decoder select
 442     # the right one.
 443     uses_imm = (code.find('Rb_or_imm') != -1)
 444     if uses_imm:
 445         orig_code = code
 446         # base code is reg version:
 447         # rewrite by substituting 'Rb' for 'Rb_or_imm'
 448         code = re.sub(r'Rb_or_imm', 'Rb', orig_code)
 449         # generate immediate version by substituting 'imm'
 450         # note that imm takes no extenstion, so we extend
 451         # the regexp to replace any extension as well
 452         imm_code = re.sub(r'Rb_or_imm(\.\w+)?', 'imm', orig_code)
 453
 454     # generate declaration for register version
 455     cblk = CodeBlock(code)
 456     iop = InstObjParams(name, Name, 'AlphaStaticInst', cblk, opt_flags)
 457     decls = iop.subst('BasicDeclare')
 458
 459     if uses_imm:
 460         # append declaration for imm version
 461         imm_cblk = CodeBlock(imm_code)
 462         imm_iop = InstObjParams(name, Name + 'Imm', 'IntegerImm', imm_cblk,
 463                                 opt_flags)
 464         decls += imm_iop.subst('BasicDeclare')
 465         # decode checks IMM bit to pick correct version
 466         decode = iop.subst('RegOrImmDecode')
 467     else:
 468         # no imm version: just check for nop
 469         decode = iop.subst('OperateNopCheckDecode')
 470
 471     return (decls, decode)
 472 }};
 473
 474
 475 ////////////////////////////////////////////////////////////////////
 476 //
 477 // Floating-point instructions
 478 //
 479 //      Note that many FP-type instructions which do not support all the
 480 //      various rounding & trapping modes use the simpler format
 481 //      BasicOperateWithNopCheck.
 482 //
 483
 484 declare {{
 485     /**
 486      * Base class for general floating-point instructions.  Includes
 487      * support for various Alpha rounding and trapping modes.  Only FP
 488      * instructions that require this support are derived from this
 489      * class; the rest derive directly from AlphaStaticInst.
 490      */
 491     class AlphaFP : public  AlphaStaticInst
 492     {
 493       public:
 494         /// Alpha FP rounding modes.
 495         enum RoundingMode {
 496             Chopped = 0,        ///< round toward zero
 497             Minus_Infinity = 1, ///< round toward minus infinity
 498             Normal = 2,         ///< round to nearest (default)
 499             Dynamic = 3,        ///< use FPCR setting (in instruction)
 500             Plus_Infinity = 3   ///< round to plus inifinity (in FPCR)
 501         };
 502
 503         /// Alpha FP trapping modes.
 504         /// For instructions that produce integer results, the
 505         /// "Underflow Enable" modes really mean "Overflow Enable", and
 506         /// the assembly modifier is V rather than U.
 507         enum TrappingMode {
 508             /// default: nothing enabled
 509             Imprecise = 0,                 ///< no modifier
 510             /// underflow/overflow traps enabled, inexact disabled
 511             Underflow_Imprecise = 1,       ///< /U or /V
 512             Underflow_Precise = 5,         ///< /SU or /SV
 513             /// underflow/overflow and inexact traps enabled
 514             Underflow_Inexact_Precise = 7  ///< /SUI or /SVI
 515         };
 516
 517       protected:
 518 #if defined(linux)
 519         static const int alphaToC99RoundingMode[];
 520 #endif
 521
 522         /// Map enum RoundingMode values to disassembly suffixes.
 523         static const char *roundingModeSuffix[];
 524         /// Map enum TrappingMode values to FP disassembly suffixes.
 525         static const char *fpTrappingModeSuffix[];
 526         /// Map enum TrappingMode values to integer disassembly suffixes.
 527         static const char *intTrappingModeSuffix[];
 528
 529         /// This instruction's rounding mode.
 530         RoundingMode roundingMode;
 531         /// This instruction's trapping mode.
 532         TrappingMode trappingMode;
 533
 534         /// Constructor
 535         AlphaFP(const char *mnem, MachInst _machInst, OpClass __opClass)
 536             : AlphaStaticInst(mnem, _machInst, __opClass),
 537               roundingMode((enum RoundingMode)FP_ROUNDMODE),
 538               trappingMode((enum TrappingMode)FP_TRAPMODE)
 539         {
 540             if (trappingMode != Imprecise) {
 541                 warn("precise FP traps unimplemented\n");
 542             }
 543         }
 544
 545 #if defined(linux)
 546         int
 547         getC99RoundingMode(ExecContext *xc)
 548         {
 549             if (roundingMode == Dynamic) {
 550                 return alphaToC99RoundingMode[bits(xc->readFpcr(), 59, 58)];
 551             }
 552             else {
 553                 return alphaToC99RoundingMode[roundingMode];
 554             }
 555         }
 556 #endif
 557
 558         // This differs from the AlphaStaticInst version only in
 559         // printing suffixes for non-default rounding & trapping modes.
 560         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 561         {
 562             std::string mnem_str(mnemonic);
 563
 564 #ifndef SS_COMPATIBLE_DISASSEMBLY
 565             std::string suffix("");
 566             suffix += ((_destRegIdx[0] >= FP_Base_DepTag)
 567                        ? fpTrappingModeSuffix[trappingMode]
 568                        : intTrappingModeSuffix[trappingMode]);
 569             suffix += roundingModeSuffix[roundingMode];
 570
 571             if (suffix != "") {
 572                 mnem_str = csprintf("%s/%s", mnemonic, suffix);
 573             }
 574 #endif
 575
 576             std::stringstream ss;
 577             ccprintf(ss, "%-10s ", mnem_str.c_str());
 578
 579             // just print the first two source regs... if there's
 580             // a third one, it's a read-modify-write dest (Rc),
 581             // e.g. for CMOVxx
 582             if (_numSrcRegs > 0) {
 583                 printReg(ss, _srcRegIdx[0]);
 584             }
 585             if (_numSrcRegs > 1) {
 586                 ss << ",";
 587                 printReg(ss, _srcRegIdx[1]);
 588             }
 589
 590             // just print the first dest... if there's a second one,
 591             // it's generally implicit
 592             if (_numDestRegs > 0) {
 593                 if (_numSrcRegs > 0)
 594                     ss << ",";
 595                 printReg(ss, _destRegIdx[0]);
 596             }
 597
 598             return ss.str();
 599         }
 600     };
 601
 602 #if defined(linux)
 603     const int AlphaFP::alphaToC99RoundingMode[] = {
 604         FE_TOWARDZERO,  // Chopped
 605         FE_DOWNWARD,    // Minus_Infinity
 606         FE_TONEAREST,   // Normal
 607         FE_UPWARD       // Dynamic in inst, Plus_Infinity in FPCR
 608     };
 609 #endif
 610
 611     const char *AlphaFP::roundingModeSuffix[] = { "c", "m", "", "d" };
 612     // mark invalid trapping modes, but don't fail on them, because
 613     // you could decode anything on a misspeculated path
 614     const char *AlphaFP::fpTrappingModeSuffix[] =
 615         { "", "u", "INVTM2", "INVTM3", "INVTM4", "su", "INVTM6", "sui" };
 616     const char *AlphaFP::intTrappingModeSuffix[] =
 617         { "", "v", "INVTM2", "INVTM3", "INVTM4", "sv", "INVTM6", "svi" };
 618 }};
 619
 620
 621 def template FloatingPointDeclare {{
 622     /**
 623      * "Fast" static instruction class for "%(mnemonic)s" (imprecise
 624      * trapping mode, normal rounding mode).
 625      */
 626     class %(class_name)sFast : public %(base_class)s
 627     {
 628       public:
 629         /// Constructor.
 630         %(class_name)sFast(MachInst machInst)
 631              : %(base_class)s("%(mnemonic)s", machInst, %(op_class)s)
 632         {
 633             %(constructor)s;
 634         }
 635
 636         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 637                       Trace::InstRecord *traceData)
 638         {
 639             Fault fault = No_Fault;
 640
 641             %(fp_enable_check)s;
 642             %(exec_decl)s;
 643             %(simple_rd)s;
 644             %(code)s;
 645
 646             if (fault == No_Fault) {
 647                 %(simple_wb)s;
 648             }
 649
 650             return fault;
 651         }
 652
 653         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 654                       Trace::InstRecord *traceData)
 655         {
 656             Fault fault = No_Fault;
 657
 658             %(fp_enable_check)s;
 659             %(exec_decl)s;
 660             %(dtld_rd)s;
 661             %(code)s;
 662
 663             if (fault == No_Fault) {
 664                 %(dtld_wb)s;
 665             }
 666
 667             return fault;
 668         }
 669     };
 670
 671     /**
 672      * General static instruction class for "%(mnemonic)s".  Supports
 673      * all the various rounding and trapping modes.
 674      */
 675     class %(class_name)sGeneral : public %(base_class)s
 676     {
 677       public:
 678         /// Constructor.
 679         %(class_name)sGeneral(MachInst machInst)
 680              : %(base_class)s("%(mnemonic)s", machInst, %(op_class)s)
 681         {
 682             %(constructor)s;
 683         }
 684
 685         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 686                       Trace::InstRecord *traceData)
 687         {
 688             Fault fault = No_Fault;
 689
 690             %(fp_enable_check)s;
 691             %(exec_decl)s;
 692             %(simple_rd)s;
 693
 694 #if defined(linux)
 695             fesetround(getC99RoundingMode(xc));
 696 #endif
 697
 698             %(code)s;
 699
 700 #if defined(linux)
 701             fesetround(FE_TONEAREST);
 702 #endif
 703
 704             if (fault == No_Fault) {
 705                 %(simple_wb)s;
 706             }
 707
 708             return fault;
 709         }
 710
 711         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 712                       Trace::InstRecord *traceData)
 713         {
 714             Fault fault = No_Fault;
 715
 716             %(fp_enable_check)s;
 717             %(exec_decl)s;
 718             %(dtld_rd)s;
 719
 720 #if defined(linux)
 721             fesetround(getC99RoundingMode(xc));
 722 #endif
 723
 724             %(code)s;
 725
 726 #if defined(linux)
 727             fesetround(FE_TONEAREST);
 728 #endif
 729
 730             if (fault == No_Fault) {
 731                 %(dtld_wb)s;
 732             }
 733
 734             return fault;
 735         }
 736     };
 737 }};
 738
 739 def template FloatingPointDecode {{
 740  {
 741      bool fast = (FP_TRAPMODE == AlphaFP::Imprecise
 742                   && FP_ROUNDMODE == AlphaFP::Normal);
 743      AlphaStaticInst *i =
 744          fast ? (AlphaStaticInst *)new %(class_name)sFast(machInst) :
 745                 (AlphaStaticInst *)new %(class_name)sGeneral(machInst);
 746
 747      if (FC == 31) {
 748          i = makeNop(i);
 749      }
 750
 751      return i;
 752  }
 753 }};
 754
 755
 756 // General format for floating-point operate instructions:
 757 // - Checks trapping and rounding mode flags.  Trapping modes
 758 //   currently unimplemented (will fail).
 759 // - Generates NOP if FC == 31.
 760 def format FloatingPointOperate(code, *opt_args) {{
 761     iop = InstObjParams(name, Name, 'AlphaFP', CodeBlock(code),
 762                         opt_args)
 763     return iop.subst('FloatingPointDeclare', 'FloatingPointDecode')
 764 }};
 765
 766
 767 ////////////////////////////////////////////////////////////////////
 768 //
 769 // Memory-format instructions: LoadAddress, Load, Store
 770 //
 771
 772 declare {{
 773     /**
 774      * Base class for general Alpha memory-format instructions.
 775      */
 776     class Memory : public AlphaStaticInst
 777     {
 778       protected:
 779
 780         /// Displacement for EA calculation (signed).
 781         int32_t disp;
 782         /// Memory request flags.  See mem_req_base.hh.
 783         unsigned memAccessFlags;
 784
 785         /// Constructor
 786         Memory(const char *mnem, MachInst _machInst, OpClass __opClass)
 787             : AlphaStaticInst(mnem, _machInst, __opClass),
 788               disp(MEMDISP), memAccessFlags(0)
 789         {
 790         }
 791
 792         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 793         {
 794             return csprintf("%-10s %c%d,%d(r%d)", mnemonic,
 795                             flags[IsFloating] ? 'f' : 'r', RA, MEMDISP, RB);
 796         }
 797     };
 798
 799     /**
 800      * Base class for a few miscellaneous memory-format insts
 801      * that don't interpret the disp field: wh64, fetch, fetch_m, ecb.
 802      * None of these instructions has a destination register either.
 803      */
 804     class MemoryNoDisp : public AlphaStaticInst
 805     {
 806       protected:
 807         /// Memory request flags.  See mem_req_base.hh.
 808         unsigned memAccessFlags;
 809
 810         /// Constructor
 811         MemoryNoDisp(const char *mnem, MachInst _machInst, OpClass __opClass)
 812             : AlphaStaticInst(mnem, _machInst, __opClass),
 813               memAccessFlags(0)
 814         {
 815         }
 816
 817         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
 818         {
 819             return csprintf("%-10s (r%d)", mnemonic, RB);
 820         }
 821     };
 822
 823     /**
 824      * Base class for "fake" effective-address computation
 825      * instructions returnded by eaCompInst().
 826      */
 827     class EACompBase : public AlphaStaticInst
 828     {
 829       public:
 830         /// Constructor
 831         EACompBase(MachInst machInst)
 832             : AlphaStaticInst("(eacomp)", machInst, IntALU)
 833         {
 834         }
 835
 836         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 837                       Trace::InstRecord *traceData)
 838         { panic("attempt to execute eacomp"); }
 839
 840         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 841                       Trace::InstRecord *traceData)
 842         { panic("attempt to execute eacomp"); }
 843     };
 844
 845     /**
 846      * Base class for "fake" memory-access instructions returnded by
 847      * memAccInst().
 848      */
 849     class MemAccBase : public AlphaStaticInst
 850     {
 851       public:
 852         /// Constructor
 853         MemAccBase(MachInst machInst, OpClass __opClass)
 854             : AlphaStaticInst("(memacc)", machInst, __opClass)
 855         {
 856         }
 857
 858         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 859                       Trace::InstRecord *traceData)
 860         { panic("attempt to execute memacc"); }
 861
 862         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 863                       Trace::InstRecord *traceData)
 864         { panic("attempt to execute memacc"); }
 865     };
 866
 867 }};
 868
 869
 870 def format LoadAddress(code) {{
 871     iop = InstObjParams(name, Name, 'Memory', CodeBlock(code))
 872     return iop.subst('BasicDeclare', 'BasicDecode')
 873 }};
 874
 875
 876 def template LoadStoreDeclare {{
 877     /**
 878      * Static instruction class for "%(mnemonic)s".
 879      */
 880     class %(class_name)s : public %(base_class)s
 881     {
 882       protected:
 883
 884         /**
 885          * "Fake" effective address computation class for "%(mnemonic)s".
 886          */
 887         class EAComp : public EACompBase
 888         {
 889           public:
 890             /// Constructor
 891             EAComp(MachInst machInst)
 892                 : EACompBase(machInst)
 893             {
 894                 %(ea_constructor)s;
 895             }
 896         };
 897
 898         /**
 899          * "Fake" memory access instruction class for "%(mnemonic)s".
 900          */
 901         class MemAcc : public MemAccBase
 902         {
 903           public:
 904             /// Constructor
 905             MemAcc(MachInst machInst)
 906                 : MemAccBase(machInst, %(op_class)s)
 907             {
 908                 %(memacc_constructor)s;
 909             }
 910         };
 911
 912         /// Pointer to EAComp object.
 913         StaticInstPtr<AlphaISA> eaCompPtr;
 914         /// Pointer to MemAcc object.
 915         StaticInstPtr<AlphaISA> memAccPtr;
 916
 917       public:
 918
 919         StaticInstPtr<AlphaISA> eaCompInst() { return eaCompPtr; }
 920         StaticInstPtr<AlphaISA> memAccInst() { return memAccPtr; }
 921
 922         /// Constructor.
 923         %(class_name)s(MachInst machInst)
 924              : %(base_class)s("%(mnemonic)s", machInst, %(op_class)s),
 925                eaCompPtr(new EAComp(machInst)), memAccPtr(new MemAcc(machInst))
 926         {
 927             %(constructor)s;
 928         }
 929
 930         Fault execute(SimpleCPU *cpu, ExecContext *xc,
 931                       Trace::InstRecord *traceData)
 932         {
 933             SimpleCPU *memAccessObj = cpu;
 934             Addr EA;
 935             Fault fault = No_Fault;
 936
 937             %(fp_enable_check)s;
 938             %(exec_decl)s;
 939             %(simple_nonmem_rd)s;
 940             %(ea_code)s;
 941
 942             if (fault == No_Fault) {
 943                 %(simple_mem_rd)s;
 944                 %(memacc_code)s;
 945             }
 946
 947             if (fault == No_Fault) {
 948                 %(simple_mem_wb)s;
 949             }
 950
 951             if (fault == No_Fault) {
 952                 %(postacc_code)s;
 953             }
 954
 955             if (fault == No_Fault) {
 956                 %(simple_nonmem_wb)s;
 957             }
 958
 959             return fault;
 960         }
 961
 962         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
 963                       Trace::InstRecord *traceData)
 964         {
 965             DynInst *memAccessObj = dynInst;
 966             Addr EA;
 967             Fault fault = No_Fault;
 968
 969             %(fp_enable_check)s;
 970             %(exec_decl)s;
 971             %(dtld_nonmem_rd)s;
 972             %(ea_code)s;
 973
 974             if (fault == No_Fault) {
 975                 %(dtld_mem_rd)s;
 976                 %(memacc_code)s;
 977             }
 978
 979             if (fault == No_Fault) {
 980                 %(dtld_mem_wb)s;
 981             }
 982
 983             if (fault == No_Fault) {
 984                 %(postacc_code)s;
 985             }
 986
 987             if (fault == No_Fault) {
 988                 %(dtld_nonmem_wb)s;
 989             }
 990
 991             return fault;
 992         }
 993     };
 994 }};
 995
 996
 997 def template PrefetchDeclare {{
 998     /**
 999      * Static instruction class for "%(mnemonic)s".
1000      */
1001     class %(class_name)s : public %(base_class)s
1002     {
1003       public:
1004         /// Constructor
1005         %(class_name)s(MachInst machInst)
1006              : %(base_class)s("%(mnemonic)s", machInst, %(op_class)s)
1007         {
1008             %(constructor)s;
1009         }
1010
1011         Fault execute(SimpleCPU *cpu, ExecContext *xc,
1012                       Trace::InstRecord *traceData)
1013         {
1014             Addr EA;
1015             Fault fault = No_Fault;
1016
1017             %(fp_enable_check)s;
1018             %(exec_decl)s;
1019             %(simple_nonmem_rd)s;
1020             %(ea_code)s;
1021
1022             if (fault == No_Fault) {
1023                 cpu->prefetch(EA, memAccessFlags);
1024             }
1025
1026             return No_Fault;
1027         }
1028
1029         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
1030                       Trace::InstRecord *traceData)
1031         {
1032             Addr EA;
1033             Fault fault = No_Fault;
1034
1035             %(fp_enable_check)s;
1036             %(exec_decl)s;
1037             %(dtld_nonmem_rd)s;
1038             %(ea_code)s;
1039
1040             if (fault == No_Fault) {
1041                 dynInst->prefetch(EA, memAccessFlags);
1042             }
1043
1044             return No_Fault;
1045         }
1046     };
1047 }};
1048
1049
1050 // load instructions use Ra as dest, so check for
1051 // Ra == 31 to detect nops
1052 def template LoadNopCheckDecode {{
1053  {
1054      AlphaStaticInst *i = new %(class_name)s(machInst);
1055      if (RA == 31) {
1056          i = makeNop(i);
1057      }
1058      return i;
1059  }
1060 }};
1061
1062
1063 // for some load instructions, Ra == 31 indicates a prefetch (not a nop)
1064 def template LoadPrefetchCheckDecode {{
1065  {
1066      if (RA != 31) {
1067          return new %(class_name)s(machInst);
1068      }
1069      else {
1070          return new %(class_name)sPrefetch(machInst);
1071      }
1072  }
1073 }};
1074
1075
1076 let {{
1077 global LoadStoreBase
1078 def LoadStoreBase(name, Name, ea_code, memacc_code, postacc_code = '',
1079                   base_class = 'Memory', flags = [],
1080                   declare_template = 'LoadStoreDeclare',
1081                   decode_template = 'BasicDecode'):
1082     # Segregate flags into instruction flags (handled by InstObjParams)
1083     # and memory access flags (handled here).
1084
1085     # Would be nice to autogenerate this list, but oh well.
1086     valid_mem_flags = ['LOCKED', 'EVICT_NEXT', 'PF_EXCLUSIVE']
1087     inst_flags = []
1088     mem_flags = []
1089     for f in flags:
1090         if f in valid_mem_flags:
1091             mem_flags.append(f)
1092         else:
1093             inst_flags.append(f)
1094
1095     ea_cblk = CodeBlock(ea_code)
1096     memacc_cblk = CodeBlock(memacc_code)
1097     postacc_cblk = CodeBlock(postacc_code)
1098
1099     cblk = CodeBlock(ea_code + memacc_code + postacc_code)
1100     iop = InstObjParams(name, Name, base_class, cblk, inst_flags)
1101
1102     iop.ea_constructor = ea_cblk.constructor
1103     iop.ea_code = ea_cblk.code
1104     iop.memacc_constructor = memacc_cblk.constructor
1105     iop.memacc_code = memacc_cblk.code
1106     iop.postacc_code = postacc_cblk.code
1107
1108     mem_flags = string.join(mem_flags, '|')
1109     if mem_flags != '':
1110         iop.constructor += '\n\tmemAccessFlags = ' + mem_flags + ';'
1111
1112     return iop.subst(declare_template, decode_template)
1113 }};
1114
1115
1116 def format LoadOrNop(ea_code, memacc_code, *flags) {{
1117     return LoadStoreBase(name, Name, ea_code, memacc_code,
1118                          flags = flags,
1119                          decode_template = 'LoadNopCheckDecode')
1120 }};
1121
1122
1123 // Note that the flags passed in apply only to the prefetch version
1124 def format LoadOrPrefetch(ea_code, memacc_code, *pf_flags) {{
1125     # declare the load instruction object and generate the decode block
1126     (decls, decode) = \
1127         LoadStoreBase(name, Name, ea_code, memacc_code,
1128                       decode_template = 'LoadPrefetchCheckDecode')
1129
1130     # Declare the prefetch instruction object.
1131
1132     # convert flags from tuple to list to make them mutable
1133     pf_flags = list(pf_flags) + ['IsMemRef', 'IsLoad', 'IsDataPrefetch', 'RdPort']
1134
1135     (pfdecls, pfdecode) = \
1136         LoadStoreBase(name, Name + 'Prefetch', ea_code, '',
1137                       flags = pf_flags,
1138                       declare_template = 'PrefetchDeclare')
1139
1140     return (decls + pfdecls, decode)
1141 }};
1142
1143
1144 def format Store(ea_code, memacc_code, *flags) {{
1145     return LoadStoreBase(name, Name, ea_code, memacc_code,
1146                          flags = flags)
1147 }};
1148
1149
1150 def format StoreCond(ea_code, memacc_code, postacc_code, *flags) {{
1151     return LoadStoreBase(name, Name, ea_code, memacc_code, postacc_code,
1152                          flags = flags)
1153 }};
1154
1155
1156 // Use 'MemoryNoDisp' as base: for wh64, fetch, ecb
1157 def format MiscPrefetch(ea_code, memacc_code, *flags) {{
1158     return LoadStoreBase(name, Name, ea_code, memacc_code,
1159                          flags = flags, base_class = 'MemoryNoDisp')
1160 }};
1161
1162
1163 ////////////////////////////////////////////////////////////////////
1164
1165
1166 declare {{
1167
1168     /**
1169      * Base class for instructions whose disassembly is not purely a
1170      * function of the machine instruction (i.e., it depends on the
1171      * PC).  This class overrides the disassemble() method to check
1172      * the PC and symbol table values before re-using a cached
1173      * disassembly string.  This is necessary for branches and jumps,
1174      * where the disassembly string includes the target address (which
1175      * may depend on the PC and/or symbol table).
1176      */
1177     class PCDependentDisassembly : public AlphaStaticInst
1178     {
1179       protected:
1180         /// Cached program counter from last disassembly
1181         Addr               cachedPC;
1182         /// Cached symbol table pointer from last disassembly
1183         const SymbolTable *cachedSymtab;
1184
1185         /// Constructor
1186         PCDependentDisassembly(const char *mnem, MachInst _machInst,
1187                                OpClass __opClass)
1188             : AlphaStaticInst(mnem, _machInst, __opClass),
1189               cachedPC(0), cachedSymtab(0)
1190         {
1191         }
1192
1193         const std::string &disassemble(Addr pc, const SymbolTable *symtab)
1194         {
1195             if (!cachedDisassembly ||
1196                 pc != cachedPC || symtab != cachedSymtab)
1197             {
1198                 if (cachedDisassembly)
1199                     delete cachedDisassembly;
1200
1201                 cachedDisassembly =
1202                     new std::string(generateDisassembly(pc, symtab));
1203                 cachedPC = pc;
1204                 cachedSymtab = symtab;
1205             }
1206
1207             return *cachedDisassembly;
1208         }
1209     };
1210
1211     /**
1212      * Base class for branches (PC-relative control transfers),
1213      * conditional or unconditional.
1214      */
1215     class Branch : public PCDependentDisassembly
1216     {
1217       protected:
1218         /// Displacement to target address (signed).
1219         int32_t disp;
1220
1221         /// Constructor.
1222         Branch(const char *mnem, MachInst _machInst, OpClass __opClass)
1223             : PCDependentDisassembly(mnem, _machInst, __opClass),
1224               disp(BRDISP << 2)
1225         {
1226         }
1227
1228         Addr branchTarget(Addr branchPC)
1229         {
1230             return branchPC + 4 + disp;
1231         }
1232
1233         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1234         {
1235             std::stringstream ss;
1236
1237             ccprintf(ss, "%-10s ", mnemonic);
1238
1239             // There's only one register arg (RA), but it could be
1240             // either a source (the condition for conditional
1241             // branches) or a destination (the link reg for
1242             // unconditional branches)
1243             if (_numSrcRegs > 0) {
1244                 printReg(ss, _srcRegIdx[0]);
1245                 ss << ",";
1246             }
1247             else if (_numDestRegs > 0) {
1248                 printReg(ss, _destRegIdx[0]);
1249                 ss << ",";
1250             }
1251
1252 #ifdef SS_COMPATIBLE_DISASSEMBLY
1253             if (_numSrcRegs == 0 && _numDestRegs == 0) {
1254                 printReg(ss, 31);
1255                 ss << ",";
1256             }
1257 #endif
1258
1259             Addr target = pc + 4 + disp;
1260
1261             std::string str;
1262             if (symtab && symtab->findSymbol(target, str))
1263                 ss << str;
1264             else
1265                 ccprintf(ss, "0x%x", target);
1266
1267             return ss.str();
1268         }
1269     };
1270
1271     /**
1272      * Base class for jumps (register-indirect control transfers).  In
1273      * the Alpha ISA, these are always unconditional.
1274      */
1275     class Jump : public PCDependentDisassembly
1276     {
1277       protected:
1278
1279         /// Displacement to target address (signed).
1280         int32_t disp;
1281
1282       public:
1283         /// Constructor
1284         Jump(const char *mnem, MachInst _machInst, OpClass __opClass)
1285             : PCDependentDisassembly(mnem, _machInst, __opClass),
1286               disp(BRDISP)
1287         {
1288         }
1289
1290         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1291         {
1292             std::stringstream ss;
1293
1294             ccprintf(ss, "%-10s ", mnemonic);
1295
1296 #ifdef SS_COMPATIBLE_DISASSEMBLY
1297             if (_numDestRegs == 0) {
1298                 printReg(ss, 31);
1299                 ss << ",";
1300             }
1301 #endif
1302
1303             if (_numDestRegs > 0) {
1304                 printReg(ss, _destRegIdx[0]);
1305                 ss << ",";
1306             }
1307
1308             ccprintf(ss, "(r%d)", RB);
1309
1310             return ss.str();
1311         }
1312     };
1313 }};
1314
1315 def template JumpOrBranchDecode {{
1316     return (RA == 31)
1317         ? (StaticInst<AlphaISA> *)new %(class_name)s(machInst)
1318         : (StaticInst<AlphaISA> *)new %(class_name)sAndLink(machInst);
1319 }};
1320
1321 def format CondBranch(code) {{
1322     code = 'bool cond;\n' + code + '\nif (cond) NPC = NPC + disp;\n';
1323     iop = InstObjParams(name, Name, 'Branch', CodeBlock(code),
1324                         ('IsDirectControl', 'IsCondControl'))
1325     return iop.subst('BasicDeclare', 'BasicDecode')
1326 }};
1327
1328 let {{
1329 global UncondCtrlBase
1330 def UncondCtrlBase(name, Name, base_class, npc_expr, flags):
1331     # Declare basic control transfer w/o link (i.e. link reg is R31)
1332     nolink_code = 'NPC = %s;\n' % npc_expr
1333     nolink_iop = InstObjParams(name, Name, base_class,
1334                                CodeBlock(nolink_code), flags)
1335     decls = nolink_iop.subst('BasicDeclare')
1336
1337     # Generate declaration of '*AndLink' version, append to decls
1338     link_code = 'Ra = NPC & ~3;\n' + nolink_code
1339     link_iop = InstObjParams(name, Name + 'AndLink', base_class,
1340                              CodeBlock(link_code), flags)
1341     decls += link_iop.subst('BasicDeclare')
1342
1343     # need to use link_iop for the decode template since it is expecting
1344     # the shorter version of class_name (w/o "AndLink")
1345     return (decls, nolink_iop.subst('JumpOrBranchDecode'))
1346 }};
1347
1348 def format UncondBranch(*flags) {{
1349     flags += ('IsUncondControl', 'IsDirectControl')
1350     return UncondCtrlBase(name, Name, 'Branch', 'NPC + disp', flags)
1351 }};
1352
1353 def format Jump(*flags) {{
1354     flags += ('IsUncondControl', 'IsIndirectControl')
1355     return UncondCtrlBase(name, Name, 'Jump', '(Rb & ~3) | (NPC & 1)', flags)
1356 }};
1357
1358
1359 declare {{
1360     /**
1361      * Base class for emulated call_pal calls (used only in
1362      * non-full-system mode).
1363      */
1364     class EmulatedCallPal : public AlphaStaticInst
1365     {
1366       protected:
1367
1368         /// Constructor.
1369         EmulatedCallPal(const char *mnem, MachInst _machInst,
1370                         OpClass __opClass)
1371             : AlphaStaticInst(mnem, _machInst, __opClass)
1372         {
1373         }
1374
1375         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1376         {
1377 #ifdef SS_COMPATIBLE_DISASSEMBLY
1378             return csprintf("%s %s", "call_pal", mnemonic);
1379 #else
1380             return csprintf("%-10s %s", "call_pal", mnemonic);
1381 #endif
1382         }
1383     };
1384 }};
1385
1386 def format EmulatedCallPal(code) {{
1387     iop = InstObjParams(name, Name, 'EmulatedCallPal', CodeBlock(code))
1388     return iop.subst('BasicDeclare', 'BasicDecode')
1389 }};
1390
1391 declare {{
1392     /**
1393      * Base class for full-system-mode call_pal instructions.
1394      * Probably could turn this into a leaf class and get rid of the
1395      * parser template.
1396      */
1397     class CallPalBase : public AlphaStaticInst
1398     {
1399       protected:
1400         int palFunc;    ///< Function code part of instruction
1401         int palOffset;  ///< Target PC, offset from IPR_PAL_BASE
1402         bool palValid;  ///< is the function code valid?
1403         bool palPriv;   ///< is this call privileged?
1404
1405         /// Constructor.
1406         CallPalBase(const char *mnem, MachInst _machInst,
1407                     OpClass __opClass)
1408             : AlphaStaticInst(mnem, _machInst, __opClass),
1409               palFunc(PALFUNC)
1410         {
1411             // From the 21164 HRM (paraphrased):
1412             // Bit 7 of the function code (mask 0x80) indicates
1413             // whether the call is privileged (bit 7 == 0) or
1414             // unprivileged (bit 7 == 1).  The privileged call table
1415             // starts at 0x2000, the unprivielged call table starts at
1416             // 0x3000.  Bits 5-0 (mask 0x3f) are used to calculate the
1417             // offset.
1418             const int palPrivMask = 0x80;
1419             const int palOffsetMask = 0x3f;
1420
1421             // Pal call is invalid unless all other bits are 0
1422             palValid = ((machInst & ~(palPrivMask | palOffsetMask)) == 0);
1423             palPriv = ((machInst & palPrivMask) == 0);
1424             int shortPalFunc = (machInst & palOffsetMask);
1425             // Add 1 to base to set pal-mode bit
1426             palOffset = (palPriv ? 0x2001 : 0x3001) + (shortPalFunc << 6);
1427         }
1428
1429         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1430         {
1431             return csprintf("%-10s %#x", "call_pal", palFunc);
1432         }
1433     };
1434 }};
1435
1436
1437 def format CallPal(code) {{
1438     iop = InstObjParams(name, Name, 'CallPalBase', CodeBlock(code))
1439     return iop.subst('BasicDeclare', 'BasicDecode')
1440 }};
1441
1442 //
1443 // hw_ld, hw_st
1444 //
1445 declare {{
1446     /**
1447      * Base class for hw_ld and hw_st.
1448      */
1449     class HwLoadStore : public AlphaStaticInst
1450     {
1451       protected:
1452
1453         /// Displacement for EA calculation (signed).
1454         int16_t disp;
1455         /// Memory request flags.  See mem_req_base.hh.
1456         unsigned memAccessFlags;
1457
1458         /// Constructor
1459         HwLoadStore(const char *mnem, MachInst _machInst, OpClass __opClass)
1460             : AlphaStaticInst(mnem, _machInst, __opClass), disp(HW_LDST_DISP)
1461         {
1462             memAccessFlags = 0;
1463             if (HW_LDST_PHYS) memAccessFlags |= PHYSICAL;
1464             if (HW_LDST_ALT)  memAccessFlags |= ALTMODE;
1465             if (HW_LDST_VPTE) memAccessFlags |= VPTE;
1466             if (HW_LDST_LOCK) memAccessFlags |= LOCKED;
1467         }
1468
1469         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1470         {
1471 #ifdef SS_COMPATIBLE_DISASSEMBLY
1472             return csprintf("%-10s r%d,%d(r%d)", mnemonic, RA, disp, RB);
1473 #else
1474             // HW_LDST_LOCK and HW_LDST_COND are the same bit.
1475             const char *lock_str =
1476                 (HW_LDST_LOCK) ? (flags[IsLoad] ? ",LOCK" : ",COND") : "";
1477
1478             return csprintf("%-10s r%d,%d(r%d)%s%s%s%s%s",
1479                             mnemonic, RA, disp, RB,
1480                             HW_LDST_PHYS ? ",PHYS" : "",
1481                             HW_LDST_ALT ? ",ALT" : "",
1482                             HW_LDST_QUAD ? ",QUAD" : "",
1483                             HW_LDST_VPTE ? ",VPTE" : "",
1484                             lock_str);
1485 #endif
1486         }
1487     };
1488 }};
1489
1490
1491 def format HwLoadStore(ea_code, memacc_code, class_ext, *flags) {{
1492     return LoadStoreBase(name, Name + class_ext, ea_code, memacc_code,
1493                          flags = flags,
1494                          base_class = 'HwLoadStore')
1495 }};
1496
1497
1498 def format HwStoreCond(ea_code, memacc_code, postacc_code, class_ext, *flags) {{
1499     return LoadStoreBase(name, Name + class_ext,
1500                          ea_code, memacc_code, postacc_code,
1501                          flags = flags,
1502                          base_class = 'HwLoadStore')
1503 }};
1504
1505
1506 declare {{
1507     /**
1508      * Base class for hw_mfpr and hw_mtpr.
1509      */
1510     class HwMoveIPR : public AlphaStaticInst
1511     {
1512       protected:
1513         /// Index of internal processor register.
1514         int ipr_index;
1515
1516         /// Constructor
1517         HwMoveIPR(const char *mnem, MachInst _machInst, OpClass __opClass)
1518             : AlphaStaticInst(mnem, _machInst, __opClass),
1519               ipr_index(HW_IPR_IDX)
1520         {
1521         }
1522
1523         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1524         {
1525             if (_numSrcRegs > 0) {
1526                 // must be mtpr
1527                 return csprintf("%-10s r%d,IPR(%#x)",
1528                                 mnemonic, RA, ipr_index);
1529             }
1530             else {
1531                 // must be mfpr
1532                 return csprintf("%-10s IPR(%#x),r%d",
1533                                 mnemonic, ipr_index, RA);
1534             }
1535         }
1536     };
1537 }};
1538
1539 def format HwMoveIPR(code) {{
1540     iop = InstObjParams(name, Name, 'HwMoveIPR', CodeBlock(code))
1541     return iop.subst('BasicDeclare', 'BasicDecode')
1542 }};
1543
1544 declare {{
1545     /**
1546      * Static instruction class for unimplemented instructions that
1547      * cause simulator termination.  Note that these are recognized
1548      * (legal) instructions that the simulator does not support; the
1549      * 'Unknown' class is used for unrecognized/illegal instructions.
1550      * This is a leaf class.
1551      */
1552     class FailUnimplemented : public AlphaStaticInst
1553     {
1554       public:
1555         /// Constructor
1556         FailUnimplemented(const char *_mnemonic, MachInst _machInst)
1557             : AlphaStaticInst(_mnemonic, _machInst, No_OpClass)
1558         {
1559         }
1560
1561         Fault execute(SimpleCPU *cpu, ExecContext *xc,
1562                       Trace::InstRecord *traceData)
1563         {
1564             panic("attempt to execute unimplemented instruction '%s' "
1565                   "(inst 0x%08x, opcode 0x%x)", mnemonic, machInst, OPCODE);
1566             return Unimplemented_Opcode_Fault;
1567         }
1568
1569         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
1570                       Trace::InstRecord *traceData)
1571         {
1572             // don't panic if this is a misspeculated instruction
1573             if (!xc->spec_mode)
1574                 panic("attempt to execute unimplemented instruction '%s' "
1575                       "(inst 0x%08x, opcode 0x%x)",
1576                       mnemonic, machInst, OPCODE);
1577             return Unimplemented_Opcode_Fault;
1578         }
1579
1580         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1581         {
1582             return csprintf("%-10s (unimplemented)", mnemonic);
1583         }
1584     };
1585
1586     /**
1587      * Base class for unimplemented instructions that cause a warning
1588      * to be printed (but do not terminate simulation).  This
1589      * implementation is a little screwy in that it will print a
1590      * warning for each instance of a particular unimplemented machine
1591      * instruction, not just for each unimplemented opcode.  Should
1592      * probably make the 'warned' flag a static member of the derived
1593      * class.
1594      */
1595     class WarnUnimplemented : public AlphaStaticInst
1596     {
1597       private:
1598         /// Have we warned on this instruction yet?
1599         bool warned;
1600
1601       public:
1602         /// Constructor
1603         WarnUnimplemented(const char *_mnemonic, MachInst _machInst)
1604             : AlphaStaticInst(_mnemonic, _machInst, No_OpClass), warned(false)
1605         {
1606         }
1607
1608         Fault execute(SimpleCPU *cpu, ExecContext *xc,
1609                       Trace::InstRecord *traceData)
1610         {
1611             if (!warned) {
1612                 warn("instruction '%s' unimplemented\n", mnemonic);
1613                 warned = true;
1614             }
1615
1616             return No_Fault;
1617         }
1618
1619         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
1620                       Trace::InstRecord *traceData)
1621         {
1622             if (!xc->spec_mode && !warned) {
1623                 warn("instruction '%s' unimplemented\n", mnemonic);
1624                 warned = true;
1625             }
1626
1627             return No_Fault;
1628         }
1629
1630         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1631         {
1632 #ifdef SS_COMPATIBLE_DISASSEMBLY
1633             return csprintf("%-10s", mnemonic);
1634 #else
1635             return csprintf("%-10s (unimplemented)", mnemonic);
1636 #endif
1637         }
1638     };
1639 }};
1640
1641 def template WarnUnimplDeclare {{
1642     /**
1643      * Static instruction class for "%(mnemonic)s".
1644      */
1645     class %(class_name)s : public %(base_class)s
1646     {
1647       public:
1648         /// Constructor
1649         %(class_name)s(MachInst machInst)
1650              : %(base_class)s("%(mnemonic)s", machInst)
1651         {
1652         }
1653     };
1654 }};
1655
1656
1657 def format FailUnimpl() {{
1658     iop = InstObjParams(name, 'FailUnimplemented')
1659     return ('', iop.subst('BasicDecodeWithMnemonic'))
1660 }};
1661
1662 def format WarnUnimpl() {{
1663     iop = InstObjParams(name, Name, 'WarnUnimplemented')
1664     return iop.subst('WarnUnimplDeclare', 'BasicDecode')
1665 }};
1666
1667 declare {{
1668     /**
1669      * Static instruction class for unknown (illegal) instructions.
1670      * These cause simulator termination if they are executed in a
1671      * non-speculative mode.  This is a leaf class.
1672      */
1673     class Unknown : public AlphaStaticInst
1674     {
1675       public:
1676         /// Constructor
1677         Unknown(MachInst _machInst)
1678             : AlphaStaticInst("unknown", _machInst, No_OpClass)
1679         {
1680         }
1681
1682         Fault execute(SimpleCPU *cpu, ExecContext *xc,
1683                       Trace::InstRecord *traceData)
1684         {
1685             panic("attempt to execute unknown instruction "
1686                   "(inst 0x%08x, opcode 0x%x)", machInst, OPCODE);
1687             return Unimplemented_Opcode_Fault;
1688         }
1689
1690         Fault execute(FullCPU *cpu, SpecExecContext *xc, DynInst *dynInst,
1691                       Trace::InstRecord *traceData)
1692         {
1693             // don't panic if this is a misspeculated instruction
1694             if (!xc->spec_mode)
1695                 panic("attempt to execute unknown instruction "
1696                       "(inst 0x%08x, opcode 0x%x)", machInst, OPCODE);
1697             return Unimplemented_Opcode_Fault;
1698         }
1699
1700         std::string generateDisassembly(Addr pc, const SymbolTable *symtab)
1701         {
1702             return csprintf("%-10s (inst 0x%x, opcode 0x%x)",
1703                             "unknown", machInst, OPCODE);
1704         }
1705     };
1706 }};
1707
1708 def format Unknown() {{
1709     return ('', 'return new Unknown(machInst);\n')
1710 }};
1711
1712 declare {{
1713
1714     /// Return opa + opb, summing carry into third arg.
1715     inline uint64_t
1716     addc(uint64_t opa, uint64_t opb, int &carry)
1717     {
1718         uint64_t res = opa + opb;
1719         if (res < opa || res < opb)
1720             ++carry;
1721         return res;
1722     }
1723
1724     /// Multiply two 64-bit values (opa * opb), returning the 128-bit
1725     /// product in res_hi and res_lo.
1726     void
1727     mul128(uint64_t opa, uint64_t opb, uint64_t &res_hi, uint64_t &res_lo)
1728     {
1729         // do a 64x64 --> 128 multiply using four 32x32 --> 64 multiplies
1730         uint64_t opa_hi = opa<63:32>;
1731         uint64_t opa_lo = opa<31:0>;
1732         uint64_t opb_hi = opb<63:32>;
1733         uint64_t opb_lo = opb<31:0>;
1734
1735         res_lo = opa_lo * opb_lo;
1736
1737         // The middle partial products logically belong in bit
1738         // positions 95 to 32.  Thus the lower 32 bits of each product
1739         // sum into the upper 32 bits of the low result, while the
1740         // upper 32 sum into the low 32 bits of the upper result.
1741         uint64_t partial1 = opa_hi * opb_lo;
1742         uint64_t partial2 = opa_lo * opb_hi;
1743
1744         uint64_t partial1_lo = partial1<31:0> << 32;
1745         uint64_t partial1_hi = partial1<63:32>;
1746         uint64_t partial2_lo = partial2<31:0> << 32;
1747         uint64_t partial2_hi = partial2<63:32>;
1748
1749         // Add partial1_lo and partial2_lo to res_lo, keeping track
1750         // of any carries out
1751         int carry_out = 0;
1752         res_lo = addc(partial1_lo, res_lo, carry_out);
1753         res_lo = addc(partial2_lo, res_lo, carry_out);
1754
1755         // Now calculate the high 64 bits...
1756         res_hi = (opa_hi * opb_hi) + partial1_hi + partial2_hi + carry_out;
1757     }
1758
1759     /// Map 8-bit S-floating exponent to 11-bit T-floating exponent.
1760     /// See Table 2-2 of Alpha AHB.
1761     inline int
1762     map_s(int old_exp)
1763     {
1764         int hibit = old_exp<7:>;
1765         int lobits = old_exp<6:0>;
1766
1767         if (hibit == 1) {
1768             return (lobits == 0x7f) ? 0x7ff : (0x400 | lobits);
1769         }
1770         else {
1771             return (lobits == 0) ? 0 : (0x380 | lobits);
1772         }
1773     }
1774
1775     /// Convert a 32-bit S-floating value to the equivalent 64-bit
1776     /// representation to be stored in an FP reg.
1777     inline uint64_t
1778     s_to_t(uint32_t s_val)
1779     {
1780         uint64_t tmp = s_val;
1781         return (tmp<31:> << 63 // sign bit
1782                 | (uint64_t)map_s(tmp<30:23>) << 52 // exponent
1783                 | tmp<22:0> << 29); // fraction
1784     }
1785
1786     /// Convert a 64-bit T-floating value to the equivalent 32-bit
1787     /// S-floating representation to be stored in memory.
1788     inline int32_t
1789     t_to_s(uint64_t t_val)
1790     {
1791         return (t_val<63:62> << 30   // sign bit & hi exp bit
1792                 | t_val<58:29>);     // rest of exp & fraction
1793     }
1794 }};
1795
1796 decode OPCODE default Unknown::unknown() {
1797
1798     format LoadAddress {
1799         0x08: lda({{ Ra = Rb + disp; }});
1800         0x09: ldah({{ Ra = Rb + (disp << 16); }});
1801     }
1802
1803     format LoadOrNop {
1804         0x0a: ldbu({{ EA = Rb + disp; }}, {{ Ra.uq = Mem.ub; }});
1805         0x0c: ldwu({{ EA = Rb + disp; }}, {{ Ra.uq = Mem.uw; }});
1806         0x0b: ldq_u({{ EA = (Rb + disp) & ~7; }}, {{ Ra = Mem.uq; }});
1807         0x23: ldt({{ EA = Rb + disp; }}, {{ Fa = Mem.df; }});
1808         0x2a: ldl_l({{ EA = Rb + disp; }}, {{ Ra.sl = Mem.sl; }}, LOCKED);
1809         0x2b: ldq_l({{ EA = Rb + disp; }}, {{ Ra.uq = Mem.uq; }}, LOCKED);
1810     }
1811
1812     format LoadOrPrefetch {
1813         0x28: ldl({{ EA = Rb + disp; }}, {{ Ra.sl = Mem.sl; }});
1814         0x29: ldq({{ EA = Rb + disp; }}, {{ Ra.uq = Mem.uq; }}, EVICT_NEXT);
1815         // IsFloating flag on lds gets the prefetch to disassemble
1816         // using f31 instead of r31... funcitonally it's unnecessary
1817         0x22: lds({{ EA = Rb + disp; }}, {{ Fa.uq = s_to_t(Mem.ul); }},
1818                   PF_EXCLUSIVE, IsFloating);
1819     }
1820
1821     format Store {
1822         0x0e: stb({{ EA = Rb + disp; }}, {{ Mem.ub = Ra<7:0>; }});
1823         0x0d: stw({{ EA = Rb + disp; }}, {{ Mem.uw = Ra<15:0>; }});
1824         0x2c: stl({{ EA = Rb + disp; }}, {{ Mem.ul = Ra<31:0>; }});
1825         0x2d: stq({{ EA = Rb + disp; }}, {{ Mem.uq = Ra.uq; }});
1826         0x0f: stq_u({{ EA = (Rb + disp) & ~7; }}, {{ Mem.uq = Ra.uq; }});
1827         0x26: sts({{ EA = Rb + disp; }}, {{ Mem.ul = t_to_s(Fa.uq); }});
1828         0x27: stt({{ EA = Rb + disp; }}, {{ Mem.df = Fa; }});
1829     }
1830
1831     format StoreCond {
1832         0x2e: stl_c({{ EA = Rb + disp; }}, {{ Mem.ul = Ra<31:0>; }},
1833                     {{
1834                         uint64_t tmp = Mem_write_result;
1835                         // see stq_c
1836                         Ra = (tmp == 0 || tmp == 1) ? tmp : Ra;
1837                     }}, LOCKED);
1838         0x2f: stq_c({{ EA = Rb + disp; }}, {{ Mem.uq = Ra; }},
1839                     {{
1840                         uint64_t tmp = Mem_write_result;
1841                         // If the write operation returns 0 or 1, then
1842                         // this was a conventional store conditional,
1843                         // and the value indicates the success/failure
1844                         // of the operation.  If another value is
1845                         // returned, then this was a Turbolaser
1846                         // mailbox access, and we don't update the
1847                         // result register at all.
1848                         Ra = (tmp == 0 || tmp == 1) ? tmp : Ra;
1849                     }}, LOCKED);
1850     }
1851
1852     format IntegerOperate {
1853
1854         0x10: decode INTFUNC {  // integer arithmetic operations
1855
1856             0x00: addl({{ Rc.sl = Ra.sl + Rb_or_imm.sl; }});
1857             0x40: addlv({{
1858                 uint32_t tmp  = Ra.sl + Rb_or_imm.sl;
1859                 // signed overflow occurs when operands have same sign
1860                 // and sign of result does not match.
1861                 if (Ra.sl<31:> == Rb_or_imm.sl<31:> && tmp<31:> != Ra.sl<31:>)
1862                     fault = Integer_Overflow_Fault;
1863                 Rc.sl = tmp;
1864             }});
1865             0x02: s4addl({{ Rc.sl = (Ra.sl << 2) + Rb_or_imm.sl; }});
1866             0x12: s8addl({{ Rc.sl = (Ra.sl << 3) + Rb_or_imm.sl; }});
1867
1868             0x20: addq({{ Rc = Ra + Rb_or_imm; }});
1869             0x60: addqv({{
1870                 uint64_t tmp = Ra + Rb_or_imm;
1871                 // signed overflow occurs when operands have same sign
1872                 // and sign of result does not match.
1873                 if (Ra<63:> == Rb_or_imm<63:> && tmp<63:> != Ra<63:>)
1874                     fault = Integer_Overflow_Fault;
1875                 Rc = tmp;
1876             }});
1877             0x22: s4addq({{ Rc = (Ra << 2) + Rb_or_imm; }});
1878             0x32: s8addq({{ Rc = (Ra << 3) + Rb_or_imm; }});
1879
1880             0x09: subl({{ Rc.sl = Ra.sl - Rb_or_imm.sl; }});
1881             0x49: sublv({{
1882                 uint32_t tmp  = Ra.sl - Rb_or_imm.sl;
1883                 // signed overflow detection is same as for add,
1884                 // except we need to look at the *complemented*
1885                 // sign bit of the subtrahend (Rb), i.e., if the initial
1886                 // signs are the *same* then no overflow can occur
1887                 if (Ra.sl<31:> != Rb_or_imm.sl<31:> && tmp<31:> != Ra.sl<31:>)
1888                     fault = Integer_Overflow_Fault;
1889                 Rc.sl = tmp;
1890             }});
1891             0x0b: s4subl({{ Rc.sl = (Ra.sl << 2) - Rb_or_imm.sl; }});
1892             0x1b: s8subl({{ Rc.sl = (Ra.sl << 3) - Rb_or_imm.sl; }});
1893
1894             0x29: subq({{ Rc = Ra - Rb_or_imm; }});
1895             0x69: subqv({{
1896                 uint64_t tmp  = Ra - Rb_or_imm;
1897                 // signed overflow detection is same as for add,
1898                 // except we need to look at the *complemented*
1899                 // sign bit of the subtrahend (Rb), i.e., if the initial
1900                 // signs are the *same* then no overflow can occur
1901                 if (Ra<63:> != Rb_or_imm<63:> && tmp<63:> != Ra<63:>)
1902                     fault = Integer_Overflow_Fault;
1903                 Rc = tmp;
1904             }});
1905             0x2b: s4subq({{ Rc = (Ra << 2) - Rb_or_imm; }});
1906             0x3b: s8subq({{ Rc = (Ra << 3) - Rb_or_imm; }});
1907
1908             0x2d: cmpeq({{ Rc = (Ra == Rb_or_imm); }});
1909             0x6d: cmple({{ Rc = (Ra.sq <= Rb_or_imm.sq); }});
1910             0x4d: cmplt({{ Rc = (Ra.sq <  Rb_or_imm.sq); }});
1911             0x3d: cmpule({{ Rc = (Ra.uq <= Rb_or_imm.uq); }});
1912             0x1d: cmpult({{ Rc = (Ra.uq <  Rb_or_imm.uq); }});
1913
1914             0x0f: cmpbge({{
1915                 int hi = 7;
1916                 int lo = 0;
1917                 uint64_t tmp = 0;
1918                 for (int i = 0; i < 8; ++i) {
1919                     tmp |= (Ra.uq<hi:lo> >= Rb_or_imm.uq<hi:lo>) << i;
1920                     hi += 8;
1921                     lo += 8;
1922                 }
1923                 Rc = tmp;
1924             }});
1925         }
1926
1927         0x11: decode INTFUNC {  // integer logical operations
1928
1929             0x00: and({{ Rc = Ra & Rb_or_imm; }});
1930             0x08: bic({{ Rc = Ra & ~Rb_or_imm; }});
1931             0x20: bis({{ Rc = Ra | Rb_or_imm; }});
1932             0x28: ornot({{ Rc = Ra | ~Rb_or_imm; }});
1933             0x40: xor({{ Rc = Ra ^ Rb_or_imm; }});
1934             0x48: eqv({{ Rc = Ra ^ ~Rb_or_imm; }});
1935
1936             // conditional moves
1937             0x14: cmovlbs({{ Rc = ((Ra & 1) == 1) ? Rb_or_imm : Rc; }});
1938             0x16: cmovlbc({{ Rc = ((Ra & 1) == 0) ? Rb_or_imm : Rc; }});
1939             0x24: cmoveq({{ Rc = (Ra == 0) ? Rb_or_imm : Rc; }});
1940             0x26: cmovne({{ Rc = (Ra != 0) ? Rb_or_imm : Rc; }});
1941             0x44: cmovlt({{ Rc = (Ra.sq <  0) ? Rb_or_imm : Rc; }});
1942             0x46: cmovge({{ Rc = (Ra.sq >= 0) ? Rb_or_imm : Rc; }});
1943             0x64: cmovle({{ Rc = (Ra.sq <= 0) ? Rb_or_imm : Rc; }});
1944             0x66: cmovgt({{ Rc = (Ra.sq >  0) ? Rb_or_imm : Rc; }});
1945
1946             // For AMASK, RA must be R31.
1947             0x61: decode RA {
1948                 31: amask({{ Rc = Rb_or_imm & ~ULL(0x17); }});
1949             }
1950
1951             // For IMPLVER, RA must be R31 and the B operand
1952             // must be the immediate value 1.
1953             0x6c: decode RA {
1954                 31: decode IMM {
1955                     1: decode INTIMM {
1956                         // return EV5 for FULL_SYSTEM and EV6 otherwise
1957                         1: implver({{
1958 #ifdef FULL_SYSTEM
1959                              Rc = 1;
1960 #else
1961                              Rc = 2;
1962 #endif
1963                         }});
1964                     }
1965                 }
1966             }
1967
1968 #ifdef FULL_SYSTEM
1969             // The mysterious 11.25...
1970             0x25: WarnUnimpl::eleven25();
1971 #endif
1972         }
1973
1974         0x12: decode INTFUNC {
1975             0x39: sll({{ Rc = Ra << Rb_or_imm<5:0>; }});
1976             0x34: srl({{ Rc = Ra.uq >> Rb_or_imm<5:0>; }});
1977             0x3c: sra({{ Rc = Ra.sq >> Rb_or_imm<5:0>; }});
1978
1979             0x02: mskbl({{ Rc = Ra & ~(mask( 8) << (Rb_or_imm<2:0> * 8)); }});
1980             0x12: mskwl({{ Rc = Ra & ~(mask(16) << (Rb_or_imm<2:0> * 8)); }});
1981             0x22: mskll({{ Rc = Ra & ~(mask(32) << (Rb_or_imm<2:0> * 8)); }});
1982             0x32: mskql({{ Rc = Ra & ~(mask(64) << (Rb_or_imm<2:0> * 8)); }});
1983
1984             0x52: mskwh({{
1985                 int bv = Rb_or_imm<2:0>;
1986                 Rc =  bv ? (Ra & ~(mask(16) >> (64 - 8 * bv))) : Ra;
1987             }});
1988             0x62: msklh({{
1989                 int bv = Rb_or_imm<2:0>;
1990                 Rc =  bv ? (Ra & ~(mask(32) >> (64 - 8 * bv))) : Ra;
1991             }});
1992             0x72: mskqh({{
1993                 int bv = Rb_or_imm<2:0>;
1994                 Rc =  bv ? (Ra & ~(mask(64) >> (64 - 8 * bv))) : Ra;
1995             }});
1996
1997             0x06: extbl({{ Rc = (Ra.uq >> (Rb_or_imm<2:0> * 8))< 7:0>; }});
1998             0x16: extwl({{ Rc = (Ra.uq >> (Rb_or_imm<2:0> * 8))<15:0>; }});
1999             0x26: extll({{ Rc = (Ra.uq >> (Rb_or_imm<2:0> * 8))<31:0>; }});
2000             0x36: extql({{ Rc = (Ra.uq >> (Rb_or_imm<2:0> * 8)); }});
2001
2002             0x5a: extwh({{
2003                 Rc = (Ra << (64 - (Rb_or_imm<2:0> * 8))<5:0>)<15:0>; }});
2004             0x6a: extlh({{
2005                 Rc = (Ra << (64 - (Rb_or_imm<2:0> * 8))<5:0>)<31:0>; }});
2006             0x7a: extqh({{
2007                 Rc = (Ra << (64 - (Rb_or_imm<2:0> * 8))<5:0>); }});
2008
2009             0x0b: insbl({{ Rc = Ra< 7:0> << (Rb_or_imm<2:0> * 8); }});
2010             0x1b: inswl({{ Rc = Ra<15:0> << (Rb_or_imm<2:0> * 8); }});
2011             0x2b: insll({{ Rc = Ra<31:0> << (Rb_or_imm<2:0> * 8); }});
2012             0x3b: insql({{ Rc = Ra       << (Rb_or_imm<2:0> * 8); }});
2013
2014             0x57: inswh({{
2015                 int bv = Rb_or_imm<2:0>;
2016                 Rc = bv ? (Ra.uq<15:0> >> (64 - 8 * bv)) : 0;
2017             }});
2018             0x67: inslh({{
2019                 int bv = Rb_or_imm<2:0>;
2020                 Rc = bv ? (Ra.uq<31:0> >> (64 - 8 * bv)) : 0;
2021             }});
2022             0x77: insqh({{
2023                 int bv = Rb_or_imm<2:0>;
2024                 Rc = bv ? (Ra.uq       >> (64 - 8 * bv)) : 0;
2025             }});
2026
2027             0x30: zap({{
2028                 uint64_t zapmask = 0;
2029                 for (int i = 0; i < 8; ++i) {
2030                     if (Rb_or_imm<i:>)
2031                         zapmask |= (mask(8) << (i * 8));
2032                 }
2033                 Rc = Ra & ~zapmask;
2034             }});
2035             0x31: zapnot({{
2036                 uint64_t zapmask = 0;
2037                 for (int i = 0; i < 8; ++i) {
2038                     if (!Rb_or_imm<i:>)
2039                         zapmask |= (mask(8) << (i * 8));
2040                 }
2041                 Rc = Ra & ~zapmask;
2042             }});
2043         }
2044
2045         0x13: decode INTFUNC {  // integer multiplies
2046             0x00: mull({{ Rc.sl = Ra.sl * Rb_or_imm.sl; }}, IntMULT);
2047             0x20: mulq({{ Rc    = Ra    * Rb_or_imm;    }}, IntMULT);
2048             0x30: umulh({{
2049                 uint64_t hi, lo;
2050                 mul128(Ra, Rb_or_imm, hi, lo);
2051                 Rc = hi;
2052             }}, IntMULT);
2053             0x40: mullv({{
2054                 // 32-bit multiply with trap on overflow
2055                 int64_t Rax = Ra.sl;    // sign extended version of Ra.sl
2056                 int64_t Rbx = Rb_or_imm.sl;
2057                 int64_t tmp = Rax * Rbx;
2058                 // To avoid overflow, all the upper 32 bits must match
2059                 // the sign bit of the lower 32.  We code this as
2060                 // checking the upper 33 bits for all 0s or all 1s.
2061                 uint64_t sign_bits = tmp<63:31>;
2062                 if (sign_bits != 0 && sign_bits != mask(33))
2063                     fault = Integer_Overflow_Fault;
2064                 Rc.sl = tmp<31:0>;
2065             }}, IntMULT);
2066             0x60: mulqv({{
2067                 // 64-bit multiply with trap on overflow
2068                 uint64_t hi, lo;
2069                 mul128(Ra, Rb_or_imm, hi, lo);
2070                 // all the upper 64 bits must match the sign bit of
2071                 // the lower 64
2072                 if (!((hi == 0 && lo<63:> == 0) ||
2073                       (hi == mask(64) && lo<63:> == 1)))
2074                     fault = Integer_Overflow_Fault;
2075                 Rc = lo;
2076             }}, IntMULT);
2077         }
2078
2079         0x1c: decode INTFUNC {
2080             0x00: decode RA { 31: sextb({{ Rc.sb = Rb_or_imm< 7:0>; }}); }
2081             0x01: decode RA { 31: sextw({{ Rc.sw = Rb_or_imm<15:0>; }}); }
2082
2083             format FailUnimpl {
2084                 0x30: ctpop();
2085                 0x31: perr();
2086                 0x32: ctlz();
2087                 0x33: cttz();
2088                 0x34: unpkbw();
2089                 0x35: unpkbl();
2090                 0x36: pkwb();
2091                 0x37: pklb();
2092                 0x38: minsb8();
2093                 0x39: minsw4();
2094                 0x3a: minub8();
2095                 0x3b: minuw4();
2096                 0x3c: maxub8();
2097                 0x3d: maxuw4();
2098                 0x3e: maxsb8();
2099                 0x3f: maxsw4();
2100             }
2101
2102             format BasicOperateWithNopCheck {
2103                 0x70: decode RB {
2104                     31: ftoit({{ Rc = Fa.uq; }}, FloatCVT);
2105                 }
2106                 0x78: decode RB {
2107                     31: ftois({{ Rc.sl = t_to_s(Fa.uq); }},
2108                               FloatCVT);
2109                 }
2110             }
2111         }
2112     }
2113
2114     // Conditional branches.
2115     format CondBranch {
2116         0x39: beq({{ cond = (Ra == 0); }});
2117         0x3d: bne({{ cond = (Ra != 0); }});
2118         0x3e: bge({{ cond = (Ra.sq >= 0); }});
2119         0x3f: bgt({{ cond = (Ra.sq >  0); }});
2120         0x3b: ble({{ cond = (Ra.sq <= 0); }});
2121         0x3a: blt({{ cond = (Ra.sq < 0); }});
2122         0x38: blbc({{ cond = ((Ra & 1) == 0); }});
2123         0x3c: blbs({{ cond = ((Ra & 1) == 1); }});
2124
2125         0x31: fbeq({{ cond = (Fa == 0); }});
2126         0x35: fbne({{ cond = (Fa != 0); }});
2127         0x36: fbge({{ cond = (Fa >= 0); }});
2128         0x37: fbgt({{ cond = (Fa >  0); }});
2129         0x33: fble({{ cond = (Fa <= 0); }});
2130         0x32: fblt({{ cond = (Fa < 0); }});
2131     }
2132
2133     // unconditional branches
2134     format UncondBranch {
2135         0x30: br();
2136         0x34: bsr(IsCall);
2137     }
2138
2139     // indirect branches
2140     0x1a: decode JMPFUNC {
2141         format Jump {
2142             0: jmp();
2143             1: jsr(IsCall);
2144             2: ret(IsReturn);
2145             3: jsr_coroutine(IsCall, IsReturn);
2146         }
2147     }
2148
2149     // IEEE floating point
2150     0x14: decode FP_SHORTFUNC {
2151         // Integer to FP register moves must have RB == 31
2152         0x4: decode RB {
2153             31: decode FP_FULLFUNC {
2154                 format BasicOperateWithNopCheck {
2155                     0x004: itofs({{ Fc.uq = s_to_t(Ra.ul); }}, FloatCVT);
2156                     0x024: itoft({{ Fc.uq = Ra.uq; }}, FloatCVT);
2157                     0x014: FailUnimpl::itoff(); // VAX-format conversion
2158                 }
2159             }
2160         }
2161
2162         // Square root instructions must have FA == 31
2163         0xb: decode FA {
2164             31: decode FP_TYPEFUNC {
2165                 format FloatingPointOperate {
2166 #ifdef SS_COMPATIBLE_FP
2167                     0x0b: sqrts({{
2168                         if (Fb < 0.0)
2169                             fault = Arithmetic_Fault;
2170                         Fc = sqrt(Fb);
2171                     }}, FloatSQRT);
2172 #else
2173                     0x0b: sqrts({{
2174                         if (Fb.sf < 0.0)
2175                             fault = Arithmetic_Fault;
2176                         Fc.sf = sqrt(Fb.sf);
2177                     }}, FloatSQRT);
2178 #endif
2179                     0x2b: sqrtt({{
2180                         if (Fb < 0.0)
2181                             fault = Arithmetic_Fault;
2182                         Fc = sqrt(Fb);
2183                     }}, FloatSQRT);
2184                 }
2185             }
2186         }
2187
2188         // VAX-format sqrtf and sqrtg are not implemented
2189         0xa: FailUnimpl::sqrtfg();
2190     }
2191
2192     // IEEE floating point
2193     0x16: decode FP_SHORTFUNC_TOP2 {
2194         // The top two bits of the short function code break this space
2195         // into four groups: binary ops, compares, reserved, and conversions.
2196         // See Table 4-12 of AHB.
2197         // Most of these instructions may have various trapping and
2198         // rounding mode flags set; these are decoded in the
2199         // FloatingPointDecode template used by the
2200         // FloatingPointOperate format.
2201
2202         // add/sub/mul/div: just decode on the short function code
2203         // and source type.
2204         0: decode FP_TYPEFUNC {
2205             format FloatingPointOperate {
2206 #ifdef SS_COMPATIBLE_FP
2207                 0x00: adds({{ Fc = Fa + Fb; }});
2208                 0x01: subs({{ Fc = Fa - Fb; }});
2209                 0x02: muls({{ Fc = Fa * Fb; }}, FloatMULT);
2210                 0x03: divs({{ Fc = Fa / Fb; }}, FloatDIV);
2211 #else
2212                 0x00: adds({{ Fc.sf = Fa.sf + Fb.sf; }});
2213                 0x01: subs({{ Fc.sf = Fa.sf - Fb.sf; }});
2214                 0x02: muls({{ Fc.sf = Fa.sf * Fb.sf; }}, FloatMULT);
2215                 0x03: divs({{ Fc.sf = Fa.sf / Fb.sf; }}, FloatDIV);
2216 #endif
2217
2218                 0x20: addt({{ Fc = Fa + Fb; }});
2219                 0x21: subt({{ Fc = Fa - Fb; }});
2220                 0x22: mult({{ Fc = Fa * Fb; }}, FloatMULT);
2221                 0x23: divt({{ Fc = Fa / Fb; }}, FloatDIV);
2222             }
2223         }
2224
2225         // Floating-point compare instructions must have the default
2226         // rounding mode, and may use the default trapping mode or
2227         // /SU.  Both trapping modes are treated the same by M5; the
2228         // only difference on the real hardware (as far a I can tell)
2229         // is that without /SU you'd get an imprecise trap if you
2230         // tried to compare a NaN with something else (instead of an
2231         // "unordered" result).
2232         1: decode FP_FULLFUNC {
2233             format BasicOperateWithNopCheck {
2234                 0x0a5, 0x5a5: cmpteq({{ Fc = (Fa == Fb) ? 2.0 : 0.0; }},
2235                                      FloatCMP);
2236                 0x0a7, 0x5a7: cmptle({{ Fc = (Fa <= Fb) ? 2.0 : 0.0; }},
2237                                      FloatCMP);
2238                 0x0a6, 0x5a6: cmptlt({{ Fc = (Fa <  Fb) ? 2.0 : 0.0; }},
2239                                      FloatCMP);
2240                 0x0a4, 0x5a4: cmptun({{ // unordered
2241                     Fc = (!(Fa < Fb) && !(Fa == Fb) && !(Fa > Fb)) ? 2.0 : 0.0;
2242                 }}, FloatCMP);
2243             }
2244         }
2245
2246         // The FP-to-integer and integer-to-FP conversion insts
2247         // require that FA be 31.
2248         3: decode FA {
2249             31: decode FP_TYPEFUNC {
2250                 format FloatingPointOperate {
2251                     0x2f: cvttq({{ Fc.sq = (int64_t)rint(Fb); }});
2252
2253                     // The cvtts opcode is overloaded to be cvtst if the trap
2254                     // mode is 2 or 6 (which are not valid otherwise)
2255                     0x2c: decode FP_FULLFUNC {
2256                         format BasicOperateWithNopCheck {
2257                             // trap on denorm version "cvtst/s" is
2258                             // simulated same as cvtst
2259                             0x2ac, 0x6ac: cvtst({{ Fc = Fb.sf; }});
2260                         }
2261                       default: cvtts({{ Fc.sf = Fb; }});
2262                     }
2263
2264                     // The trapping mode for integer-to-FP conversions
2265                     // must be /SUI or nothing; /U and /SU are not
2266                     // allowed.  The full set of rounding modes are
2267                     // supported though.
2268                     0x3c: decode FP_TRAPMODE {
2269                         0,7: cvtqs({{ Fc.sf = Fb.sq; }});
2270                     }
2271                     0x3e: decode FP_TRAPMODE {
2272                         0,7: cvtqt({{ Fc    = Fb.sq; }});
2273                     }
2274                 }
2275             }
2276         }
2277     }
2278
2279     // misc FP operate
2280     0x17: decode FP_FULLFUNC {
2281         format BasicOperateWithNopCheck {
2282             0x010: cvtlq({{
2283                 Fc.sl = (Fb.uq<63:62> << 30) | Fb.uq<58:29>;
2284             }});
2285             0x030: cvtql({{
2286                 Fc.uq = (Fb.uq<31:30> << 62) | (Fb.uq<29:0> << 29);
2287             }});
2288
2289             // We treat the precise & imprecise trapping versions of
2290             // cvtql identically.
2291             0x130, 0x530: cvtqlv({{
2292                 // To avoid overflow, all the upper 32 bits must match
2293                 // the sign bit of the lower 32.  We code this as
2294                 // checking the upper 33 bits for all 0s or all 1s.
2295                 uint64_t sign_bits = Fb.uq<63:31>;
2296                 if (sign_bits != 0 && sign_bits != mask(33))
2297                     fault = Integer_Overflow_Fault;
2298                 Fc.uq = (Fb.uq<31:30> << 62) | (Fb.uq<29:0> << 29);
2299             }});
2300
2301             0x020: cpys({{  // copy sign
2302                 Fc.uq = (Fa.uq<63:> << 63) | Fb.uq<62:0>;
2303             }});
2304             0x021: cpysn({{ // copy sign negated
2305                 Fc.uq = (~Fa.uq<63:> << 63) | Fb.uq<62:0>;
2306             }});
2307             0x022: cpyse({{ // copy sign and exponent
2308                 Fc.uq = (Fa.uq<63:52> << 52) | Fb.uq<51:0>;
2309             }});
2310
2311             0x02a: fcmoveq({{ Fc = (Fa == 0) ? Fb : Fc; }});
2312             0x02b: fcmovne({{ Fc = (Fa != 0) ? Fb : Fc; }});
2313             0x02c: fcmovlt({{ Fc = (Fa <  0) ? Fb : Fc; }});
2314             0x02d: fcmovge({{ Fc = (Fa >= 0) ? Fb : Fc; }});
2315             0x02e: fcmovle({{ Fc = (Fa <= 0) ? Fb : Fc; }});
2316             0x02f: fcmovgt({{ Fc = (Fa >  0) ? Fb : Fc; }});
2317
2318             0x024: mt_fpcr({{ FPCR = Fa.uq; }});
2319             0x025: mf_fpcr({{ Fa.uq = FPCR; }});
2320         }
2321     }
2322
2323     // miscellaneous mem-format ops
2324     0x18: decode MEMFUNC {
2325         format WarnUnimpl {
2326             0x0000: trapb();
2327             0x0400: excb();
2328             0x4000: mb();
2329             0x4400: wmb();
2330             0x8000: fetch();
2331             0xa000: fetch_m();
2332             0xe800: ecb();
2333         }
2334
2335         format MiscPrefetch {
2336             0xf800: wh64({{ EA = Rb; }},
2337                          {{ memAccessObj->writeHint(EA, 64); }},
2338                          IsMemRef, IsStore, WrPort);
2339         }
2340
2341         format BasicOperate {
2342             0xc000: rpcc({{ Ra = curTick; }});
2343         }
2344
2345 #ifdef FULL_SYSTEM
2346         format BasicOperate {
2347             0xe000: rc({{
2348                 Ra = xc->regs.intrflag;
2349                 if (!xc->misspeculating()) {
2350                     xc->regs.intrflag = 0;
2351                 }
2352             }}, No_OpClass);
2353             0xf000: rs({{
2354                 Ra = xc->regs.intrflag;
2355                 if (!xc->misspeculating()) {
2356                     xc->regs.intrflag = 1;
2357                 }
2358             }}, No_OpClass);
2359         }
2360 #else
2361         format FailUnimpl {
2362             0xe000: rc();
2363             0xf000: rs();
2364         }
2365 #endif
2366     }
2367
2368 #ifdef FULL_SYSTEM
2369     0x00: CallPal::call_pal({{
2370         if (!palValid ||
2371             (palPriv
2372              && xc->readIpr(AlphaISA::IPR_ICM, fault) != AlphaISA::mode_kernel)) {
2373             // invalid pal function code, or attempt to do privileged
2374             // PAL call in non-kernel mode
2375             fault = Unimplemented_Opcode_Fault;
2376         }
2377         else {
2378             bool dopal = true;
2379
2380             if (!xc->misspeculating()) {
2381                 // check to see if simulator wants to do something special
2382                 // on this PAL call (including maybe suppress it)
2383                 dopal = xc->simPalCheck(palFunc);
2384
2385                 Annotate::Callpal(xc, palFunc);
2386
2387                 if (dopal) {
2388                     AlphaISA::swap_palshadow(&xc->regs, true);
2389                     xc->setIpr(AlphaISA::IPR_EXC_ADDR, NPC);
2390                 }
2391             }
2392
2393             // if we're misspeculating, it's still safe (if
2394             // unrealistic) to set NPC, as the control-flow change
2395             // won't get committed.
2396             if (dopal) {
2397                 NPC = xc->readIpr(AlphaISA::IPR_PAL_BASE, fault) + palOffset;
2398             }
2399         }
2400     }});
2401 #else
2402     0x00: decode PALFUNC {
2403         format EmulatedCallPal {
2404             0x00: halt ({{
2405                 if (!xc->misspeculating())
2406                     SimExit(curTick, "halt instruction encountered");
2407             }});
2408             0x83: callsys({{
2409                 if (!xc->misspeculating())
2410                     xc->syscall();
2411             }});
2412             // Read uniq reg into ABI return value register (r0)
2413             0x9e: rduniq({{ R0 = Runiq; }});
2414             // Write uniq reg with value from ABI arg register (r16)
2415             0x9f: wruniq({{ Runiq = R16; }});
2416         }
2417     }
2418 #endif
2419
2420 #ifdef FULL_SYSTEM
2421     format HwLoadStore {
2422         0x1b: decode HW_LDST_QUAD {
2423             0: hw_ld({{ EA = (Rb + disp) & ~3; }}, {{ Ra = Mem.ul; }}, L);
2424             1: hw_ld({{ EA = (Rb + disp) & ~7; }}, {{ Ra = Mem.uq; }}, Q);
2425         }
2426
2427         0x1f: decode HW_LDST_COND {
2428             0: decode HW_LDST_QUAD {
2429                 0: hw_st({{ EA = (Rb + disp) & ~3; }},
2430                          {{ Mem.ul = Ra<31:0>; }}, L);
2431                 1: hw_st({{ EA = (Rb + disp) & ~7; }},
2432                          {{ Mem.uq = Ra.uq; }}, Q);
2433             }
2434
2435             1: FailUnimpl::hw_st_cond();
2436         }
2437     }
2438
2439     format BasicOperate {
2440         0x1e: hw_rei({{ xc->hwrei(); }});
2441
2442         // M5 special opcodes use the reserved 0x01 opcode space
2443         0x01: decode M5FUNC {
2444             0x00: arm({{
2445                 if (!xc->misspeculating()) {
2446                     Annotate::ARM(xc);
2447                     xc->kernelStats.arm();
2448                 }
2449             }});
2450             0x01: quiesce({{
2451                 if (!xc->misspeculating())
2452                     AlphaPseudo::quiesce(xc);
2453             }});
2454             0x10: ivlb({{
2455                 if (!xc->misspeculating()) {
2456                     Annotate::BeginInterval(xc);
2457                     xc->kernelStats.ivlb();
2458                 }
2459             }}, No_OpClass);
2460             0x11: ivle({{
2461                 if (!xc->misspeculating())
2462                     Annotate::EndInterval(xc);
2463             }}, No_OpClass);
2464             0x20: m5exit_old({{
2465                 if (!xc->misspeculating())
2466                     AlphaPseudo::m5exit_old(xc);
2467             }}, No_OpClass);
2468             0x21: m5exit({{
2469                 if (!xc->misspeculating())
2470                     AlphaPseudo::m5exit(xc);
2471             }}, No_OpClass);
2472             0x30: initparam({{ Ra = xc->cpu->system->init_param; }});
2473             0x40: resetstats({{
2474                 if (!xc->misspeculating())
2475                     AlphaPseudo::resetstats(xc);
2476             }});
2477             0x41: dumpstats({{
2478                 if (!xc->misspeculating())
2479                     AlphaPseudo::dumpstats(xc);
2480             }});
2481             0x42: dumpresetstats({{
2482                 if (!xc->misspeculating())
2483                     AlphaPseudo::dumpresetstats(xc);
2484             }});
2485             0x43: m5checkpoint({{
2486                 if (!xc->misspeculating())
2487                     AlphaPseudo::m5checkpoint(xc);
2488             }});
2489         }
2490     }
2491
2492     format HwMoveIPR {
2493         0x19: hw_mfpr({{
2494             // this instruction is only valid in PAL mode
2495             if (!PC_PAL(xc->regs.pc)) {
2496                 fault = Unimplemented_Opcode_Fault;
2497             }
2498             else {
2499                 Ra = xc->readIpr(ipr_index, fault);
2500             }
2501         }});
2502         0x1d: hw_mtpr({{
2503             // this instruction is only valid in PAL mode
2504             if (!PC_PAL(xc->regs.pc)) {
2505                 fault = Unimplemented_Opcode_Fault;
2506             }
2507             else {
2508                 xc->setIpr(ipr_index, Ra);
2509                 if (traceData) { traceData->setData(Ra); }
2510             }
2511         }});
2512     }
2513 #endif
2514 }