a79ce4e748
Reviewed-by: kvn, jbhateja, njian, ngasson
1957 lines
86 KiB
Python
1957 lines
86 KiB
Python
import os
|
|
import random
|
|
import subprocess
|
|
import sys
|
|
|
|
# Names of the external assembler, objdump and objcopy executables.
# NOTE(review): presumably launched through `subprocess` further down the
# file; the call sites are not visible in this part of the source.
AARCH64_AS      = "as"
AARCH64_OBJDUMP = "objdump"
AARCH64_OBJCOPY = "objcopy"
|
|
|
|
# These tables are legal immediate logical operands.
# One table per operand width (8, 16, 32 and 64 bits); entries are picked
# by random index, so the order and any repeated entry are significant.
immediates8 = [
    0x1, 0x0c, 0x3e, 0x60, 0x7c, 0x80, 0x83,
    0xe1, 0xbf, 0xef, 0xf3, 0xfe,
]

immediates16 = [
    0x1, 0x38, 0x7e, 0xff, 0x1fc, 0x1ff, 0x3f0,
    0x7e0, 0xfc0, 0x1f80, 0x3ff0, 0x7e00, 0x7e00,
    0x8000, 0x81ff, 0xc1ff, 0xc003, 0xc7ff, 0xdfff,
    0xe03f, 0xe10f, 0xe1ff, 0xf801, 0xfc00, 0xfc07,
    0xff03, 0xfffe,
]

immediates32 = [
    0x1, 0x3f, 0x1f0, 0x7e0,
    0x1c00, 0x3ff0, 0x8000, 0x1e000,
    0x3e000, 0x78000, 0xe0000, 0x100000,
    0x1fffe0, 0x3fe000, 0x780000, 0x7ffff8,
    0xff8000, 0x1800180, 0x1fffc00, 0x3c003c0,
    0x3ffff00, 0x7c00000, 0x7fffe00, 0xf000f00,
    0xfffe000, 0x18181818, 0x1ffc0000, 0x1ffffffe,
    0x3f003f00, 0x3fffe000, 0x60006000, 0x7f807f80,
    0x7ffffc00, 0x800001ff, 0x803fffff, 0x9f9f9f9f,
    0xc0000fff, 0xc0c0c0c0, 0xe0000000, 0xe003e003,
    0xe3ffffff, 0xf0000fff, 0xf0f0f0f0, 0xf80000ff,
    0xf83ff83f, 0xfc00007f, 0xfc1fffff, 0xfe0001ff,
    0xfe3fffff, 0xff003fff, 0xff800003, 0xff87ff87,
    0xffc00fff, 0xffe0000f, 0xffefffef, 0xfff1fff1,
    0xfff83fff, 0xfffc0fff, 0xfffe0fff, 0xffff3fff,
    0xffffc007, 0xffffe1ff, 0xfffff80f, 0xfffffe07,
    0xffffffbf, 0xfffffffd,
]

immediates64 = [
    0x1, 0x1f80, 0x3fff0, 0x3ffffc,
    0x3fe0000, 0x1ffc0000, 0xf8000000, 0x3ffffc000,
    0xffffffe00, 0x3ffffff800, 0xffffc00000, 0x3f000000000,
    0x7fffffff800, 0x1fe000001fe0, 0x3ffffff80000, 0xc00000000000,
    0x1ffc000000000, 0x3ffff0003ffff, 0x7ffffffe00000, 0xfffffffffc000,
    0x1ffffffffffc00, 0x3fffffffffff00, 0x7ffffffffffc00, 0xffffffffff8000,
    0x1ffffffff800000, 0x3fffffc03fffffc, 0x7fffc0000000000, 0xff80ff80ff80ff8,
    0x1c00000000000000, 0x1fffffffffff0000, 0x3fffff803fffff80, 0x7fc000007fc00000,
    0x8000000000000000, 0x803fffff803fffff, 0xc000007fc000007f, 0xe00000000000ffff,
    0xe3ffffffffffffff, 0xf007f007f007f007, 0xf80003ffffffffff, 0xfc000003fc000003,
    0xfe000000007fffff, 0xff00000000007fff, 0xff800000000003ff, 0xffc00000000000ff,
    0xffe00000000003ff, 0xfff0000000003fff, 0xfff80000001fffff, 0xfffc0000fffc0000,
    0xfffe003fffffffff, 0xffff3fffffffffff, 0xffffc0000007ffff, 0xffffe01fffffe01f,
    0xfffff800000007ff, 0xfffffc0fffffffff, 0xffffff00003fffff, 0xffffffc0000007ff,
    0xfffffff0000001ff, 0xfffffffc00003fff, 0xffffffff07ffffff, 0xffffffffe003ffff,
    0xfffffffffc01ffff, 0xffffffffffc00003, 0xfffffffffffc000f, 0xffffffffffffe07f,
]
|
|
|
|
class Operand(object):
    """Root of the operand hierarchy; `generate` here is a no-op."""

    def generate(self):
        """Return this operand unchanged (nothing to randomise)."""
        return self
|
|
|
|
class Register(Operand):
    """A numbered register operand."""

    def generate(self):
        """Choose a random number in 0..30 and return self.

        18 is never produced: a draw of 18 is replaced by 17.
        NOTE(review): presumably because r18 is reserved -- confirm.
        """
        drawn = random.randint(0, 30)
        self.number = 17 if drawn == 18 else drawn
        return self

    def astr(self, prefix):
        """Return the assembler spelling: `prefix` followed by the number."""
        return prefix + str(self.number)
|
|
|
|
class FloatRegister(Register):
    """Register printed with a "v" prefix."""

    def __str__(self):
        """Return "v<number>"."""
        return self.astr("v")

    def nextReg(self):
        """Return a new FloatRegister numbered one higher, wrapping 31 -> 0."""
        following = FloatRegister()
        following.number = (self.number + 1) % 32
        return following
|
|
|
|
class GeneralRegister(Register):
    """Register printed with an "r" prefix."""

    def __str__(self):
        """Return "r<number>"."""
        return self.astr("r")
|
|
|
|
class GeneralRegisterOrZr(Register):
    """General register whose number 31 is spelled "zr"."""

    def generate(self):
        """Choose a number in 0..31 (a draw of 18 becomes 16); return self."""
        drawn = random.randint(0, 31)
        self.number = 16 if drawn == 18 else drawn
        return self

    def astr(self, prefix = ""):
        """Return prefix + "zr" for number 31, otherwise prefix + number."""
        tail = "zr" if self.number == 31 else str(self.number)
        return prefix + tail

    def __str__(self):
        """Return "zr" for number 31 and "r<number>" otherwise."""
        return self.astr() if self.number == 31 else self.astr("r")
|
|
|
|
class GeneralRegisterOrSp(Register):
    """General register whose number 31 is spelled "sp"."""

    def generate(self):
        """Choose a number in 0..31 (a draw of 18 becomes 15); return self."""
        drawn = random.randint(0, 31)
        self.number = 15 if drawn == 18 else drawn
        return self

    def astr(self, prefix = ""):
        """Return "sp" (no prefix) for number 31, otherwise prefix + number."""
        if self.number != 31:
            return prefix + str(self.number)
        return "sp"

    def __str__(self):
        """Return "sp" for number 31 and "r<number>" otherwise."""
        return self.astr() if self.number == 31 else self.astr("r")
|
|
|
|
class SVEVectorRegister(FloatRegister):
    """Register printed with a "z" prefix."""

    def __str__(self):
        """Return "z<number>"."""
        return self.astr("z")
|
|
|
|
class SVEPRegister(Register):
    """Register printed with a "p" prefix, numbered 0..15."""

    def __str__(self):
        """Return "p<number>"."""
        return self.astr("p")

    def generate(self):
        """Choose a random number in 0..15 and return self."""
        self.number = random.randint(0, 15)
        return self
|
|
|
|
class SVEGoverningPRegister(Register):
    """Register printed with a "p" prefix, numbered 0..7."""

    def __str__(self):
        """Return "p<number>"."""
        return self.astr("p")

    def generate(self):
        """Choose a random number in 0..7 and return self."""
        self.number = random.randint(0, 7)
        return self
|
|
|
|
class RegVariant(object):
    """A randomly chosen element-size variant, held as a number.

    Numbers 0..4 map to b, h, s, d, q; other numbers map to None.
    """

    def __init__(self, low, high):
        """Pick the variant number uniformly from low..high inclusive."""
        self.number = random.randint(low, high)

    def astr(self):
        """Return the assembler suffix (".b" .. ".q"), or None if unknown."""
        suffixes = dict(enumerate([".b", ".h", ".s", ".d", ".q"]))
        return suffixes.get(self.number)

    def cstr(self):
        """Return the C++ spelling ("__ B" .. "__ Q"), or None if unknown."""
        spellings = dict(enumerate(["__ B", "__ H", "__ S", "__ D", "__ Q"]))
        return spellings.get(self.number)
|
|
|
|
class FloatZero(Operand):
    """The constant floating-point zero operand."""

    def __str__(self):
        """Return the C++ spelling, "0.0"."""
        return "0.0"

    def astr(self, ignored):
        """Return the assembler spelling, "#0.0"; the argument is unused."""
        return "#0.0"
|
|
|
|
class OperandFactory:
    """Creates operand objects from one-letter mode codes."""

    # Mode letter -> operand class.
    _modes = {}
    _modes.update(dict.fromkeys(['x', 'w'], GeneralRegister))
    _modes.update(dict.fromkeys(['b', 'h', 's', 'd'], FloatRegister))
    _modes.update({'z' : FloatZero,
                   'p' : SVEPRegister,
                   'P' : SVEGoverningPRegister,
                   'Z' : SVEVectorRegister})

    @classmethod
    def create(cls, mode):
        """Return a new, not yet generated, operand for `mode`.

        Raises KeyError when `mode` is not a known mode letter.
        """
        operandClass = OperandFactory._modes[mode]
        return operandClass()
|
|
|
|
class ShiftKind:
    """A randomly chosen shift operator: LSL, LSR or ASR."""

    def generate(self):
        """Pick one of the three shift kinds at random and return self."""
        choices = ["LSL", "LSR", "ASR"]
        self.kind = choices[random.randint(0,2)]
        return self

    def cstr(self):
        """Return the chosen shift kind's name."""
        return self.kind
|
|
|
|
class Instruction(object):
    """Base class for a generated instruction.

    Holds the instruction name and derives from it whether the
    instruction is a word form (name ends in "w" or "wi"), which selects
    the "w" or "x" assembler register prefix.
    """

    def __init__(self, name):
        self._name = name
        self.isWord = name.endswith(("w", "wi"))
        self.asmRegPrefix = "w" if self.isWord else "x"
        self.isPostfixException = False

    def aname(self):
        """Return the assembler mnemonic.

        A trailing "wi", "i" or "w" is stripped from the name unless
        `isPostfixException` is set.
        """
        mnemonic = self._name
        if self.isPostfixException:
            return mnemonic
        if mnemonic.endswith("wi"):
            return mnemonic[:-2]
        if mnemonic.endswith(("i", "w")):
            return mnemonic[:-1]
        return mnemonic

    def emit(self) :
        """Do nothing; placeholder in the base class."""
        pass

    def compare(self) :
        """Do nothing; placeholder in the base class."""
        pass

    def generate(self) :
        """Return self; the base instruction has nothing to randomise."""
        return self

    def cstr(self):
        """Return the opening of the C++ call: "__ <name>("."""
        return "__ " + self.name() + "("

    def astr(self):
        """Return the assembler mnemonic followed by a tab."""
        return self.aname() + "\t"

    def name(self):
        """Return the C++ method name for this instruction."""
        # Special case: the name "and" can't be used
        # in HotSpot, even for a member.
        if self._name == "and":
            return "andr"
        return self._name

    def multipleForms(self):
        """Return 0: the base instruction has no alternative forms."""
        return 0
|
|
|
|
class InstructionWithModes(Instruction):
    """Instruction whose operand size comes from an explicit mode letter.

    Modes 'd' and 's' mark the instruction as floating point; `isWord`
    and `asmRegPrefix` are then derived from the mode instead of from the
    instruction name.
    """

    def __init__(self, name, mode):
        Instruction.__init__(self, name)
        self.mode = mode
        self.isFloat = mode in ('d', 's')
        if self.isFloat:
            self.isWord = mode != 'd'
            self.asmRegPrefix = "s" if self.isWord else "d"
        else:
            self.isWord = mode != 'x'
            self.asmRegPrefix = "w" if self.isWord else "x"

    def name(self):
        """Return the C++ method name: the base name plus the mode letter,
        except that mode 'x' adds nothing."""
        return self._name + (self.mode if self.mode != 'x' else '')

    def aname(self):
        """Return the assembler mnemonic: only the 'b' and 'h' modes are
        appended to the base name."""
        # The original read the bare name `mode`, which is not defined in
        # this scope and raised NameError; the instance attribute is meant.
        if self.mode in ('b', 'h'):
            return self._name + self.mode
        return self._name
|
|
|
|
class ThreeRegInstruction(Instruction):
    """Instruction taking three general registers."""

    def generate(self):
        """Generate three random general registers into self.reg."""
        first = GeneralRegister().generate()
        second = GeneralRegister().generate()
        third = GeneralRegister().generate()
        self.reg = [first, second, third]
        return self

    def cstr(self):
        """Return the C++ call up to and including the third register."""
        # Only the first three entries are used; subclasses may hold more.
        operands = ", ".join([str(self.reg[i]) for i in range(3)])
        return super(ThreeRegInstruction, self).cstr() + operands

    def astr(self):
        """Return the assembler text up to and including the third register."""
        regPrefix = self.asmRegPrefix
        operands = ", ".join([self.reg[i].astr(regPrefix) for i in range(3)])
        return super(ThreeRegInstruction, self).astr() + operands
|
|
|
|
class FourRegInstruction(ThreeRegInstruction):
    """Instruction taking four general registers."""

    def generate(self):
        """Generate the three base registers, then a fourth."""
        ThreeRegInstruction.generate(self)
        fourth = GeneralRegister().generate()
        self.reg = self.reg + [fourth]
        return self

    def cstr(self):
        """Return the three-register C++ text plus the fourth register."""
        head = super(FourRegInstruction, self).cstr()
        return head + ", " + str(self.reg[3])

    def astr(self):
        """Return the three-register assembler text plus the fourth register."""
        head = super(FourRegInstruction, self).astr()
        return head + ", " + self.reg[3].astr(self.asmRegPrefix)
|
|
|
|
class TwoRegInstruction(Instruction):
    """Instruction taking two general registers."""

    def generate(self):
        """Generate two random general registers into self.reg."""
        first = GeneralRegister().generate()
        second = GeneralRegister().generate()
        self.reg = [first, second]
        return self

    def cstr(self):
        """Return the C++ call up to and including the second register."""
        operands = str(self.reg[0]) + ", " + str(self.reg[1])
        return super(TwoRegInstruction, self).cstr() + operands

    def astr(self):
        """Return the assembler text up to and including the second register."""
        regPrefix = self.asmRegPrefix
        operands = self.reg[0].astr(regPrefix) + ", " + self.reg[1].astr(regPrefix)
        return super(TwoRegInstruction, self).astr() + operands
|
|
|
|
class TwoRegImmedInstruction(TwoRegInstruction):
    """Two-register instruction with an unsigned immediate operand."""

    def generate(self):
        """Generate the registers and a random immediate in 0..2047."""
        super(TwoRegImmedInstruction, self).generate()
        # The original `1<<11 -1` parses as `1<<(11-1)` because "-" binds
        # tighter than "<<", giving an upper bound of 1024.  Parenthesised
        # to give the 11-bit maximum that the expression's shape suggests.
        self.immed = random.randint(0, (1<<11) - 1)
        return self

    def cstr(self):
        """Return the C++ text with the immediate appended as "<n>u"."""
        return (super(TwoRegImmedInstruction, self).cstr()
                + ', %su' % self.immed)

    def astr(self):
        """Return the assembler text with the immediate appended as "#<n>"."""
        return (super(TwoRegImmedInstruction, self).astr()
                + ', #%s' % self.immed)
|
|
|
|
class OneRegOp(Instruction):
    """Instruction taking a single general register."""

    def generate(self):
        """Generate one random general register into self.reg."""
        self.reg = GeneralRegister().generate()
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        return super(OneRegOp, self).cstr() + str(self.reg) + ");"

    def astr(self):
        """Return the complete assembler line."""
        operand = self.reg.astr(self.asmRegPrefix)
        return super(OneRegOp, self).astr() + '%s' % operand
|
|
|
|
class PostfixExceptionOneRegOp(OneRegOp):
    """OneRegOp whose name is used as the mnemonic without suffix stripping."""

    def __init__(self, op):
        OneRegOp.__init__(self, op)
        # Makes Instruction.aname() return the name untouched.
        self.isPostfixException = True
|
|
|
|
class ArithOp(ThreeRegInstruction):
    """Three-register instruction with a shifted last operand."""

    def generate(self):
        """Generate registers, a shift kind and a shift distance.

        The distance is in 0..31 for word forms and 0..63 otherwise.
        """
        super(ArithOp, self).generate()
        self.kind = ShiftKind().generate()
        if self.isWord:
            maxDistance = (1<<5)-1
        else:
            maxDistance = (1<<6)-1
        self.distance = random.randint(0, maxDistance)
        return self

    def cstr(self):
        """Return the complete C++ statement including shift kind and distance."""
        return (ThreeRegInstruction.cstr(self)
                + ", Assembler::%s" % self.kind.cstr()
                + ", %s);" % self.distance)

    def astr(self):
        """Return the complete assembler line including the shift."""
        return (ThreeRegInstruction.astr(self)
                + ", %s" % self.kind.cstr()
                + " #%s" % self.distance)
|
|
|
|
class AddSubCarryOp(ThreeRegInstruction):
    """Three-register instruction with no further operands."""

    def cstr(self):
        """Return the three-register C++ text closed with ");"."""
        return ThreeRegInstruction.cstr(self) + ");"
|
|
|
|
class AddSubExtendedOp(ThreeRegInstruction):
    """Three-register instruction with an extend option and amount."""

    # Extend option names; the class constants below index into this list.
    optNames = ["uxtb", "uxth", "uxtw", "uxtx", "sxtb", "sxth", "sxtw", "sxtx"]
    uxtb, uxth, uxtw, uxtx, sxtb, sxth, sxtw, sxtx = range(8)

    def generate(self):
        """Generate registers, an amount in 1..4 and an option in 0..7."""
        super(AddSubExtendedOp, self).generate()
        self.amount = random.randint(1, 4)
        self.option = random.randint(0, 7)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        optionName = AddSubExtendedOp.optNames[self.option]
        tail = ", ext::%s, %s);" % (optionName, str(self.amount))
        return super(AddSubExtendedOp, self).cstr() + tail

    def astr(self):
        """Return the complete assembler line."""
        optionName = AddSubExtendedOp.optNames[self.option]
        tail = ", %s #%s" % (optionName, str(self.amount))
        return super(AddSubExtendedOp, self).astr() + tail
|
|
|
|
class AddSubImmOp(TwoRegImmedInstruction):
    """Two-register-plus-immediate instruction with no further operands."""

    def cstr(self):
        """Return the parent's C++ text closed with ");"."""
        head = super(AddSubImmOp, self).cstr()
        return head + ");"
|
|
|
|
class LogicalImmOp(AddSubImmOp):
    """Two-register instruction with an immediate from the module tables."""

    def generate(self):
        """Generate registers, then replace the immediate with a table entry.

        Word forms draw from immediates32, other forms from immediates64.
        """
        AddSubImmOp.generate(self)
        if self.isWord:
            table = immediates32
        else:
            table = immediates64
        self.immed = table[random.randint(0, len(table)-1)]
        return self

    def astr(self):
        """Return the assembler line with the immediate printed in hex."""
        # Skips TwoRegImmedInstruction.astr, which would print it in decimal.
        head = super(TwoRegImmedInstruction, self).astr()
        return head + ', #0x%x' % self.immed

    def cstr(self):
        """Return the C++ statement; the immediate gets an "ll" suffix."""
        # Skips AddSubImmOp.cstr, which would close the call too early.
        head = super(AddSubImmOp, self).cstr()
        return head + "ll);"
|
|
|
|
class SVEBinaryImmOp(Instruction):
    """SVE instruction taking one vector register (used twice) and an immediate."""

    def __init__(self, name):
        vreg = SVEVectorRegister().generate()
        # The same register object appears in both operand slots.
        self.reg = [vreg, vreg]
        self.numRegs = len(self.reg)
        self._width = RegVariant(0, 3)
        self._isLogical = name in ["and", "eor", "orr"]
        Instruction.__init__(self, name)

    def generate(self):
        """Choose the immediate and return self.

        An 8-bit random value is always drawn first; for the logical
        instructions it is then replaced by an entry of the immediates
        table matching the element width.
        """
        Instruction.generate(self)
        self.immed = random.randint(0, (1<<8)-1)
        if self._isLogical:
            tables = {"__ B": immediates8,
                      "__ H": immediates16,
                      "__ S": immediates32,
                      "__ D": immediates64}
            table = tables.get(self._width.cstr())
            if table is not None:
                self.immed = table[random.randint(0, len(table)-1)]
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        return ("__ sve_" + self._name + "("
                + "%s, %s, %su);" % (str(self.reg[0]), self._width.cstr(),
                                     self.immed))

    def astr(self):
        """Return the complete assembler line; the immediate is in hex."""
        names = [str(self.reg[i]) + self._width.astr()
                 for i in range(0, self.numRegs)]
        pieces = [Instruction.astr(self)] + names + [self.immed]
        return "%s%s, %s, #0x%x" % tuple(pieces)
|
|
|
|
class SVEComparisonWithZero(Instruction):
    """SVE "fcm<cond>" comparison of a vector register against 0.0."""

    def __init__(self, arg):
        Instruction.__init__(self, "fcm")
        self.condition = arg
        # Operands are drawn in this fixed order.
        self.dest = OperandFactory.create('p').generate()
        self.reg = SVEVectorRegister().generate()
        self._width = RegVariant(2, 3)
        self.preg = OperandFactory.create('P').generate()

    def generate(self):
        """Return self; all operands were chosen in the constructor."""
        return Instruction.generate(self)

    def cstr(self):
        """Return the complete C++ statement."""
        arguments = ["Assembler::" + self.condition,
                     str(self.dest),
                     self._width.cstr(),
                     str(self.preg),
                     str(self.reg)]
        template = "__ sve_" + self._name + "(%s, %s, %s, %s, %s, 0.0);"
        return template % tuple(arguments)

    def astr(self):
        """Return the complete assembler line with a zeroing predicate."""
        mnemonic = self._name + self.condition.lower()
        destination = str(self.dest) + self._width.astr()
        source = str(self.reg) + self._width.astr()
        return "%s\t%s, %s/z, %s, #0.0" % (mnemonic, destination,
                                            str(self.preg), source)
|
|
|
|
class MultiOp():
    """Mixin for instructions that are emitted in three target forms."""

    def multipleForms(self):
        """Return the number of forms, 3."""
        return 3

    def forms(self):
        """Return the C++ spellings of the three targets."""
        targets = ["__ pc()", "back", "forth"]
        return targets

    def aforms(self):
        """Return the assembler spellings of the three targets."""
        targets = [".", "back", "forth"]
        return targets
|
|
|
|
class AbsOp(MultiOp, Instruction):
    """Instruction whose only operand is a target.

    Both methods return a template with one "%s" left for the target.
    """

    def cstr(self):
        """Return the C++ template."""
        head = super(AbsOp, self).cstr()
        return head + "%s);"

    def astr(self):
        """Return the assembler template."""
        head = Instruction.astr(self)
        return head + "%s"
|
|
|
|
class RegAndAbsOp(MultiOp, Instruction):
    """Instruction taking a register and a target.

    cstr/astr return templates with one "%s" left for the target.
    """

    def multipleForms(self):
        """Return 1 for "adrp" and 3 for everything else."""
        # We can only test one form of adrp because anything other
        # than "adrp ." requires relocs in the assembler output
        return 1 if self.name() == "adrp" else 3

    def generate(self):
        """Generate one random general register into self.reg."""
        Instruction.generate(self)
        self.reg = GeneralRegister().generate()
        return self

    def cstr(self):
        """Return the C++ template; "adrp" is emitted as "_adrp"."""
        operands = str(self.reg) + ", %s);"
        if self.name() == "adrp":
            return "__ _adrp(" + operands
        return super(RegAndAbsOp, self).cstr() + operands

    def astr(self):
        """Return the assembler template."""
        register = self.reg.astr(self.asmRegPrefix)
        return super(RegAndAbsOp, self).astr() + register + ", %s"
|
|
|
|
class RegImmAbsOp(RegAndAbsOp):
    """Instruction taking a register, an immediate and a target.

    cstr/astr return templates with one "%s" left for the target.
    """

    def cstr(self):
        """Return the C++ template."""
        return (Instruction.cstr(self)
                + "%s, %s, %s);" % (self.reg, self.immed, "%s"))

    def astr(self):
        """Return the assembler template."""
        return (Instruction.astr(self)
                + ("%s, #%s, %s"
                   % (self.reg.astr(self.asmRegPrefix), self.immed, "%s")))

    def generate(self):
        """Generate the register and a random immediate in 0..31."""
        super(RegImmAbsOp, self).generate()
        # The original `1<<5 -1` parses as `1<<(5-1)` (upper bound 16)
        # because "-" binds tighter than "<<"; parenthesised to give the
        # 5-bit maximum that the expression's shape suggests.
        self.immed = random.randint(0, (1<<5) - 1)
        return self
|
|
|
|
class MoveWideImmOp(RegImmAbsOp):
    """Instruction taking a register, an immediate and a left shift."""

    def multipleForms(self):
        """Return 0: there is no target operand, so only one form."""
        return 0

    def cstr(self):
        """Return the complete C++ statement."""
        return (Instruction.cstr(self)
                + "%s, %s, %s);" % (self.reg, self.immed, self.shift))

    def astr(self):
        """Return the complete assembler line."""
        return (Instruction.astr(self)
                + ("%s, #%s, lsl %s"
                   % (self.reg.astr(self.asmRegPrefix),
                      self.immed, self.shift)))

    def generate(self):
        """Generate the register, an immediate in 0..65535 and a shift.

        The shift is 0 or 16 for word forms, and 0, 16, 32 or 48 otherwise.
        """
        # Deliberately skips RegImmAbsOp.generate (and its random draw) and
        # starts at the next class in the MRO.
        super(RegImmAbsOp, self).generate()
        # The original `1<<16 -1` parses as `1<<(16-1)` (upper bound 32768)
        # because "-" binds tighter than "<<"; parenthesised to give the
        # 16-bit maximum that the expression's shape suggests.
        self.immed = random.randint(0, (1<<16) - 1)
        if self.isWord:
            self.shift = random.randint(0, 1) * 16
        else:
            self.shift = random.randint(0, 3) * 16
        return self
|
|
|
|
class BitfieldOp(TwoRegInstruction):
    """Two-register instruction with immr and imms immediates."""

    def cstr(self):
        """Return the complete C++ statement."""
        arguments = (self.reg[0], self.reg[1], self.immr, self.imms)
        return Instruction.cstr(self) + "%s, %s, %s, %s);" % arguments

    def astr(self):
        """Return the complete assembler line."""
        immediates = ", #%s, #%s" % (self.immr, self.imms)
        return TwoRegInstruction.astr(self) + immediates

    def generate(self):
        """Generate the registers and both immediates, each in 0..31."""
        TwoRegInstruction.generate(self)
        self.immr = random.randint(0, 31)
        self.imms = random.randint(0, 31)
        return self
|
|
|
|
class ExtractOp(ThreeRegInstruction):
    """Three-register instruction with an lsb immediate."""

    def generate(self):
        """Generate registers and an lsb in 0..31 (word) or 0..63."""
        super(ExtractOp, self).generate()
        if self.isWord:
            highest = (1<<5)-1
        else:
            highest = (1<<6)-1
        self.lsb = random.randint(0, highest)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        return "%s, %s);" % (ThreeRegInstruction.cstr(self), self.lsb)

    def astr(self):
        """Return the complete assembler line."""
        return "%s, #%s" % (ThreeRegInstruction.astr(self), self.lsb)
|
|
|
|
class CondBranchOp(MultiOp, Instruction):
    """Conditional branch; the instruction name is the condition.

    Both methods return a template with one "%s" left for the target.
    """

    def cstr(self):
        """Return the C++ template."""
        return "__ br(Assembler::%s" % self.name() + ", %s);"

    def astr(self):
        """Return the assembler template."""
        return "b.%s" % self.name() + "\t%s"
|
|
|
|
class ImmOp(Instruction):
    """Instruction whose only operand is an immediate."""

    def cstr(self):
        """Return the complete C++ statement."""
        return "%s%s);" % (Instruction.cstr(self), self.immed)

    def astr(self):
        """Return the complete assembler line."""
        return Instruction.astr(self) + "#" + str(self.immed)

    def generate(self):
        """Choose a random immediate in 0..65535 and return self."""
        # The original `1<<16 -1` parses as `1<<(16-1)` (upper bound 32768)
        # because "-" binds tighter than "<<"; parenthesised to give the
        # 16-bit maximum that the expression's shape suggests.
        self.immed = random.randint(0, (1<<16) - 1)
        return self
|
|
|
|
class Op(Instruction):
    """Instruction with no operands."""

    def cstr(self):
        """Return the complete C++ statement, "__ <name>();"."""
        head = Instruction.cstr(self)
        return head + ");"

    def astr(self):
        """Return the bare assembler mnemonic (no trailing tab)."""
        return self.aname()
|
|
|
|
|
|
class PostfixExceptionOp(Op):
    """Op whose name is used as the mnemonic without suffix stripping."""

    def __init__(self, op):
        Op.__init__(self, op)
        # Makes Instruction.aname() return the name untouched.
        self.isPostfixException = True
|
|
|
|
class SystemOp(Instruction):
    """Instruction whose operand is one of a given list of barrier names."""

    def __init__(self, op):
        """`op` is a pair: the instruction name and the barrier name list."""
        Instruction.__init__(self, op[0])
        self.barriers = op[1]

    def generate(self):
        """Pick one barrier from the list at random and return self."""
        Instruction.generate(self)
        lastIndex = len(self.barriers)-1
        self.barrier = self.barriers[random.randint(0, lastIndex)]
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        return "%sAssembler::%s);" % (Instruction.cstr(self), self.barrier)

    def astr(self):
        """Return the complete assembler line."""
        return "%s%s" % (Instruction.astr(self), self.barrier)
|
|
|
|
# Condition code names; the instruction classes index this list with a
# random number in 0..15, so the order matters.
conditionCodes = [
    "EQ", "NE", "HS", "CS", "LO", "CC", "MI", "PL", "VS",
    "VC", "HI", "LS", "GE", "LT", "GT", "LE", "AL", "NV",
]
|
|
|
|
class ConditionalCompareOp(TwoRegImmedInstruction):
    """Two registers, a 0..15 immediate and a condition code."""

    def generate(self):
        """Generate registers, then a condition index and an immediate.

        Both are in 0..15; the immediate chosen by the parent is replaced.
        """
        TwoRegImmedInstruction.generate(self)
        self.cond = random.randint(0, 15)
        self.immed = random.randint(0, 15)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        condition = conditionCodes[self.cond]
        head = super(ConditionalCompareOp, self).cstr()
        return head + ", Assembler::" + condition + ");"

    def astr(self):
        """Return the complete assembler line."""
        condition = conditionCodes[self.cond]
        head = super(ConditionalCompareOp, self).astr()
        return head + ", " + condition
|
|
|
|
class ConditionalCompareImmedOp(Instruction):
    """One register, two immediates and a condition code."""

    def generate(self):
        """Generate the register, condition index and both immediates.

        cond and immed2 are in 0..15, immed is in 0..31.
        """
        self.reg = GeneralRegister().generate()
        self.cond = random.randint(0, 15)
        self.immed2 = random.randint(0, 15)
        self.immed = random.randint(0, 31)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        arguments = [str(self.reg),
                     str(self.immed),
                     str(self.immed2),
                     "Assembler::" + conditionCodes[self.cond]]
        return Instruction.cstr(self) + ", ".join(arguments) + ");"

    def astr(self):
        """Return the complete assembler line."""
        operands = [self.reg.astr(self.asmRegPrefix),
                    "#" + str(self.immed),
                    "#" + str(self.immed2),
                    conditionCodes[self.cond]]
        return Instruction.astr(self) + ", ".join(operands)
|
|
|
|
class TwoRegOp(TwoRegInstruction):
    """Two-register instruction with no further operands."""

    def cstr(self):
        """Return the two-register C++ text closed with ");"."""
        head = TwoRegInstruction.cstr(self)
        return head + ");"
|
|
|
|
class ThreeRegOp(ThreeRegInstruction):
    """Three-register instruction with no further operands."""

    def cstr(self):
        """Return the three-register C++ text closed with ");"."""
        head = ThreeRegInstruction.cstr(self)
        return head + ");"
|
|
|
|
class FourRegMulOp(FourRegInstruction):
    """Four-register multiply-style instruction."""

    def cstr(self):
        """Return the four-register C++ text closed with ");"."""
        head = FourRegInstruction.cstr(self)
        return head + ");"

    def astr(self):
        """Return the complete assembler line.

        The two middle registers use the instruction's own prefix when the
        name starts with "madd" or "msub", and "w" for any other name.
        """
        outerPrefix = self.asmRegPrefix
        if self.name().startswith(("madd", "msub")):
            innerPrefix = outerPrefix
        else:
            innerPrefix = "w"
        prefixes = [outerPrefix, innerPrefix, innerPrefix, outerPrefix]
        operands = [self.reg[i].astr(prefixes[i]) for i in range(4)]
        return Instruction.astr(self) + ", ".join(operands)
|
|
|
|
class ConditionalSelectOp(ThreeRegInstruction):
    """Three-register instruction followed by a condition code."""

    def generate(self):
        """Generate registers and a condition index in 0..15."""
        ThreeRegInstruction.generate(self)
        self.cond = random.randint(0, 15)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        condition = conditionCodes[self.cond]
        return "%s, Assembler::%s);" % (ThreeRegInstruction.cstr(self), condition)

    def astr(self):
        """Return the complete assembler line."""
        condition = conditionCodes[self.cond]
        return "%s, %s" % (ThreeRegInstruction.astr(self), condition)
|
|
|
|
class LoadStoreExclusiveOp(InstructionWithModes):
    """Load/store instruction over a list of pairwise distinct registers.

    The last register in self.regs is the one printed inside "[...]".
    """

    def __init__(self, op): # op is a tuple of ["name", "mode", registers]
        InstructionWithModes.__init__(self, op[0], op[1])
        self.num_registers = op[2]

    def astr(self):
        """Return the complete assembler line."""
        operands = list(self.regs)
        index = operands.pop()      # The last reg is the index register
        # The first register is "x" only in mode 'x' for names starting
        # with "ld" or "stlr"; every other case prints it as "w".  Ewww :-(
        if self.mode == 'x' and self.name().startswith(("ld", "stlr")):
            firstPrefix = 'x'
        else:
            firstPrefix = 'w'
        first = operands.pop(0)
        pieces = [first.astr(firstPrefix)]
        pieces.extend([r.astr(self.asmRegPrefix) for r in operands])
        pieces.append("[" + index.astr("x") + "]")
        return self.aname() + '\t' + ", ".join(pieces)

    def cstr(self):
        """Return the complete C++ statement."""
        operands = list(self.regs)
        index = operands.pop()      # The last reg is the index register
        pieces = [str(r) for r in operands]
        pieces.append(str(index))
        return InstructionWithModes.cstr(self) + ", ".join(pieces) + ");"

    def appendUniqueReg(self):
        """Append a random register whose number is not yet in self.regs."""
        while True:
            candidate = GeneralRegister().generate()
            clash = False
            for existing in self.regs:
                if existing.number == candidate.number:
                    clash = True
            if not clash:
                break
        self.regs.append(candidate)

    def generate(self):
        """Fill self.regs with num_registers distinct registers."""
        self.regs = []
        for _ in range(self.num_registers):
            self.appendUniqueReg()
        return self

    def name(self):
        """Return the C++ method name: mode appended unless the mode is 'x'."""
        if self.mode != 'x':
            return self._name + self.mode
        return self._name

    def aname(self):
        """Return the mnemonic: mode appended only for modes 'b' and 'h'."""
        if self.mode in ('b', 'h'):
            return self._name + self.mode
        return self._name
|
|
|
|
class Address(object):
    """A randomly generated memory operand of one of eight kinds.

    `__str__` gives the C++ spelling and `astr` the assembler spelling.
    For the pcrel kind both return one of three target names selected by
    the offset.
    """

    # Addressing kinds; `kinds` holds the matching names at the same index.
    base_plus_unscaled_offset, pre, post, base_plus_reg, \
        base_plus_scaled_offset, pcrel, post_reg, base_only = range(8)
    kinds = ["base_plus_unscaled_offset", "pre", "post", "base_plus_reg",
             "base_plus_scaled_offset", "pcrel", "post_reg", "base_only"]
    extend_kinds = ["uxtw", "lsl", "sxtw", "sxtx"]

    @classmethod
    def kindToStr(cls, i):
        """Return the name of addressing kind number `i`."""
        return cls.kinds[i]

    def generate(self, kind, shift_distance):
        """Randomise base, index, offset, extend kind and shift; return self.

        Every entry of the offset table is evaluated, so the number of
        random draws does not depend on `kind`.  The chosen offset is then
        shifted right by (3 - shift_distance).

        Raises KeyError when `kind` is not one of the eight kinds.
        """
        self.kind = kind
        self.base = GeneralRegister().generate()
        self.index = GeneralRegister().generate()
        # The original upper bounds were written `1<<8-1` and `1<<11-1`,
        # which parse as `1<<7` and `1<<10` because "-" binds tighter than
        # "<<".  They are parenthesised here so the signed 9-bit ranges run
        # to 255 and the 11-bit range runs to 2047.
        self.offset = {
            Address.base_plus_unscaled_offset:
                random.randint(-1<<8, (1<<8)-1) | 1,
            Address.pre: random.randint(-1<<8, (1<<8)-1),
            Address.post: random.randint(-1<<8, (1<<8)-1),
            Address.pcrel: random.randint(0, 2),
            Address.base_plus_reg: 0,
            Address.base_plus_scaled_offset:
                (random.randint(0, (1<<11)-1) | (3 << 9))*8,
            Address.post_reg: 0,
            Address.base_only: 0} [kind]
        self.offset >>= (3 - shift_distance)
        self.extend_kind = Address.extend_kinds[random.randint(0, 3)]
        self.shift_distance = random.randint(0, 1) * shift_distance
        return self

    def __str__(self):
        """Return the C++ spelling of this address."""
        result = {
            Address.base_plus_unscaled_offset: "Address(%s, %s)" \
                % (str(self.base), self.offset),
            Address.pre: "Address(__ pre(%s, %s))" % (str(self.base), self.offset),
            Address.post: "Address(__ post(%s, %s))" % (str(self.base), self.offset),
            Address.post_reg: "Address(__ post(%s, %s))" % (str(self.base), self.index),
            Address.base_only: "Address(%s)" % (str(self.base)),
            Address.pcrel: "",
            Address.base_plus_reg: "Address(%s, %s, Address::%s(%s))" \
                % (self.base, self.index, self.extend_kind, self.shift_distance),
            Address.base_plus_scaled_offset:
                "Address(%s, %s)" % (self.base, self.offset) } [self.kind]
        if (self.kind == Address.pcrel):
            # The offset selects one of the three target names.
            result = ["__ pc()", "back", "forth"][self.offset]
        return result

    def astr(self, prefix):
        """Return the assembler spelling, using `prefix` for the registers.

        For base_plus_reg the index register is printed with "w" when the
        extend kind ends in "w".
        """
        extend_prefix = prefix
        if self.kind == Address.base_plus_reg:
            if self.extend_kind.endswith("w"):
                extend_prefix = "w"
        result = {
            Address.base_plus_unscaled_offset: "[%s, %s]" \
                % (self.base.astr(prefix), self.offset),
            Address.pre: "[%s, %s]!" % (self.base.astr(prefix), self.offset),
            Address.post: "[%s], %s" % (self.base.astr(prefix), self.offset),
            Address.post_reg: "[%s], %s" % (self.base.astr(prefix), self.index.astr(prefix)),
            Address.base_only: "[%s]" % (self.base.astr(prefix)),
            Address.pcrel: "",
            Address.base_plus_reg: "[%s, %s, %s #%s]" \
                % (self.base.astr(prefix), self.index.astr(extend_prefix),
                   self.extend_kind, self.shift_distance),
            Address.base_plus_scaled_offset: \
                "[%s, %s]" \
                % (self.base.astr(prefix), self.offset)
            } [self.kind]
        if (self.kind == Address.pcrel):
            # The offset selects one of the three target names.
            result = [".", "back", "forth"][self.offset]
        return result
|
|
|
|
class LoadStoreOp(InstructionWithModes):
    """Load/store of one register through a random Address."""

    def __init__(self, args):
        """`args` is (name, assembler name, address kind, mode)."""
        name, self.asmname, self.kind, mode = args
        InstructionWithModes.__init__(self, name, mode)

    def generate(self):
        """Generate the address and the transferred register; return self."""

        # This is something of a kludge, but the offset needs to be
        # scaled by the memory datamode somehow.
        shift = 3
        if (self.mode == 'b') | (self.asmname.endswith("b")):
            shift = 0
        elif (self.mode == 'h') | (self.asmname.endswith("h")):
            shift = 1
        elif (self.mode == 'w') | (self.asmname.endswith("w")) \
                | (self.mode == 's') :
            shift = 2

        self.adr = Address().generate(self.kind, shift)

        isFloat = (self.mode == 'd') | (self.mode == 's')

        regMode = FloatRegister if isFloat else GeneralRegister
        self.reg = regMode().generate()
        kindStr = Address.kindToStr(self.kind)
        # The original tested `kindStr is "pre"`, which compares object
        # identity and only works where the interpreter happens to share
        # equal string objects (and is a SyntaxWarning from Python 3.8).
        # Equality is what is meant.
        if (not isFloat) and kindStr in ("pre", "post"):
            # For pre/post addressing of a general register, redraw both
            # numbers so they are distinct from each other and neither is 18.
            (self.reg.number, self.adr.base.number) = random.sample(list(set(range(31)) - set([18])), 2)
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        if not(self._name.startswith("prfm")):
            return "%s%s, %s);" % (Instruction.cstr(self), str(self.reg), str(self.adr))
        else: # No target register for a prefetch
            return "%s%s);" % (Instruction.cstr(self), str(self.adr))

    def astr(self):
        """Return the complete assembler line."""
        if not(self._name.startswith("prfm")):
            return "%s\t%s, %s" % (self.aname(), self.reg.astr(self.asmRegPrefix),
                                   self.adr.astr("x"))
        else: # No target register for a prefetch
            return "%s %s" % (self.aname(),
                              self.adr.astr("x"))

    def aname(self):
        """Return the assembler mnemonic given to the constructor."""
        result = self.asmname
        # if self.kind == Address.base_plus_unscaled_offset:
        #     result = result.replace("ld", "ldu", 1)
        #     result = result.replace("st", "stu", 1)
        return result
|
|
|
|
class LoadStorePairOp(InstructionWithModes):
    """Load/store of a register pair with a base register and an offset."""

    numRegs = 2

    def __init__(self, args):
        """`args` is (name, assembler name, address kind, mode).

        The offset is chosen here, once, as a multiple of 16.
        """
        name, self.asmname, self.kind, mode = args
        InstructionWithModes.__init__(self, name, mode)
        # The original upper bound `1<<4-1` parses as `1<<3` because "-"
        # binds tighter than "<<"; parenthesised so the range is -16..15
        # before scaling, i.e. -256..240.
        self.offset = random.randint(-1<<4, (1<<4)-1) << 4

    def generate(self):
        """Generate the register pair and the base register; return self.

        For names starting with "ld" the two transferred registers are
        redrawn to be distinct; with pre/post addressing the base is also
        kept distinct from both of them.  None of the redrawn numbers is 18.
        """
        self.reg = [OperandFactory.create(self.mode).generate()
                    for i in range(self.numRegs)]
        self.base = OperandFactory.create('x').generate()
        kindStr = Address.kindToStr(self.kind)
        # The original tested `kindStr is "pre"`, which compares object
        # identity and only works where the interpreter happens to share
        # equal string objects (and is a SyntaxWarning from Python 3.8).
        # Equality is what is meant.
        if kindStr in ("pre", "post"):
            if self._name.startswith("ld"):
                (self.reg[0].number, self.reg[1].number, self.base.number) = random.sample(list(set(range(31)) - set([18])), 3)
            if self._name.startswith("st"):
                self.base.number = random.choice(list(set(range(31)) - set([self.reg[0].number, self.reg[1].number, 18])))
        elif self._name.startswith("ld"):
            (self.reg[0].number, self.reg[1].number) = random.sample(list(set(range(31)) - set([18])), 2)
        return self

    def astr(self):
        """Return the complete assembler line."""
        # Indexed by address kind: plain offset, pre-index, post-index.
        address = ["[%s, #%s]", "[%s, #%s]!", "[%s], #%s"][self.kind]
        address = address % (self.base.astr('x'), self.offset)
        result = "%s\t%s, %s, %s" \
            % (self.asmname,
               self.reg[0].astr(self.asmRegPrefix),
               self.reg[1].astr(self.asmRegPrefix), address)
        return result

    def cstr(self):
        """Return the complete C++ statement."""
        address = {
            Address.base_plus_unscaled_offset: "Address(%s, %s)" \
                % (str(self.base), self.offset),
            Address.pre: "Address(__ pre(%s, %s))" % (str(self.base), self.offset),
            Address.post: "Address(__ post(%s, %s))" % (str(self.base), self.offset),
            } [self.kind]
        result = "__ %s(%s, %s, %s);" \
            % (self.name(), self.reg[0], self.reg[1], address)
        return result
|
|
|
|
class FloatInstruction(Instruction):
    """Instruction whose operands are created from a list of mode letters.

    This class reads self.numRegs but never sets it.
    NOTE(review): presumably supplied by subclasses -- confirm.
    """

    def aname(self):
        """Return the mnemonic: the name with a trailing "s" or "d" removed."""
        if self._name.endswith(("s", "d")):
            return self._name[:-1]
        return self._name

    def __init__(self, args):
        """`args` is (name, modes); modes holds one letter per operand."""
        name, self.modes = args
        Instruction.__init__(self, name)

    def generate(self):
        """Create and generate one operand per entry of self.modes."""
        operands = []
        for i in range(self.numRegs):
            operands.append(OperandFactory.create(self.modes[i]).generate())
        self.reg = operands
        return self

    def cstr(self):
        """Return the complete C++ statement."""
        formatStr = "%s%s" + ", %s" * (self.numRegs - 1) + ");"
        values = [Instruction.cstr(self)]
        values.extend([str(self.reg[i]) for i in range(self.numRegs)])
        return formatStr % tuple(values)

    def astr(self):
        """Return the complete assembler line; each operand uses its own
        mode letter as its prefix."""
        formatStr = "%s%s" + ", %s" * (self.numRegs - 1)
        values = [Instruction.astr(self)]
        values.extend([self.reg[i].astr(self.modes[i])
                       for i in range(self.numRegs)])
        return formatStr % tuple(values)
|
|
|
|
class SVEVectorOp(Instruction):
    """SVE instruction over a list of registers, optionally predicated."""

    def __init__(self, args):
        """`args` is (name, register type letters, option, ...).

        Options are 'm' or 'z' (merging or zeroing predicate suffix) and
        "dn" (the destination register is repeated in the assembler text).
        """
        name = args[0]
        regTypes = args[1]
        options = args[2:]
        self.reg = [OperandFactory.create(c).generate() for c in regTypes]
        self.numRegs = len(self.reg)

        # Predicated: the second register is a governing predicate and the
        # destination is not itself a predicate register.
        self._isPredicated = regTypes[0] != "p" and regTypes[1] == 'P'
        if self._isPredicated:
            assert len(args) > 2, "Must specify predicate type"
            for opt in options:
                if opt == 'm':
                    self._merge = "/m"
                elif opt == 'z':
                    self._merge = "/z"
                else:
                    assert opt == "dn", "Unknown predicate type"
        else:
            self._merge = ""

        # Element width: names starting with "f" use s or d only, the
        # unpredicated bitwise ops always use d, the rest use b..d.
        self._bitwiseop = False
        if name[0] == 'f':
            self._width = RegVariant(2, 3)
        elif not self._isPredicated and (name in ["and", "eor", "orr", "bic"]):
            self._width = RegVariant(3, 3)
            self._bitwiseop = True
        else:
            self._width = RegVariant(0, 3)

        self._dnm = None
        for opt in options:
            if opt == "dn":
                self._dnm = opt

        Instruction.__init__(self, name)

    def cstr(self):
        """Return the complete C++ statement.

        The width argument follows the first register, except for the
        unpredicated bitwise ops, which take no width.
        """
        arguments = [str(self.reg[0])]
        if not self._bitwiseop:
            arguments.append(self._width.cstr())
        arguments.extend([str(self.reg[i]) for i in range(1, self.numRegs)])
        return "__ sve_" + self._name + "(" + "%s" % ", ".join(arguments) + ");"

    def astr(self):
        """Return the complete assembler line."""
        widthSuffix = self._width.astr()
        destination = str(self.reg[0]) + widthSuffix
        operands = [destination]
        if self._isPredicated:
            operands.append(str(self.reg[1]) + self._merge)
            firstPlain = 2
        else:
            firstPlain = 1
        if self._dnm == 'dn':
            # The destination is repeated as the first source operand.
            operands.append(destination)
        operands.extend([str(self.reg[i]) + widthSuffix
                         for i in range(firstPlain, self.numRegs)])
        return Instruction.astr(self) + ", ".join(operands)

    def generate(self):
        """Return self; all operands were chosen in the constructor."""
        return self
|
|
|
|
class SVEReductionOp(Instruction):
    """SVE reduction: scalar destination, governing predicate, vector source."""

    def __init__(self, args):
        """`args` is (name, lowest allowed width number)."""
        name = args[0]
        lowRegType = args[1]
        self.reg = []
        Instruction.__init__(self, name)
        # Destination, governing predicate and source, drawn in that order.
        for mode in ('s', 'P', 'Z'):
            self.reg.append(OperandFactory.create(mode).generate())
        self._width = RegVariant(lowRegType, 3)

    def cstr(self):
        """Return the complete C++ statement."""
        arguments = [str(self.reg[0]),
                     self._width.cstr(),
                     str(self.reg[1]),
                     str(self.reg[2])]
        return "__ sve_%s(%s, %s, %s, %s);" % tuple([self.name()] + arguments)

    def astr(self):
        """Return the complete assembler line.

        The destination is named after the element width, except that
        "uaddv" always uses a "d" register.  "fadda" repeats the destination
        after the predicate.
        """
        opName = self.name()
        number = str(self.reg[0].number)
        if opName == "uaddv":
            dstRegName = "d" + number
        else:
            dstRegName = self._width.astr()[1] + number
        operands = [dstRegName, str(self.reg[1])]
        if opName == "fadda":
            operands.append(dstRegName)
        operands.append(str(self.reg[2]) + self._width.astr())
        return "%s %s" % (opName, ", ".join(operands))
|
|
|
|
class LdStNEONOp(Instruction):
    """NEON structure load/store over a run of consecutive SIMD registers.

    ``args`` is ``[name, regnum, arrangement, addresskind]``.
    """

    def __init__(self, args):
        self._name, self.regnum, self.arrangement, self.addresskind = args

    def generate(self):
        """Pick the address and first register; fix up post-index offsets."""
        self.address = Address().generate(self.addresskind, 0)
        self._firstSIMDreg = FloatRegister().generate()
        if self.addresskind != Address.post:
            return self

        # For post addressing the offset is regnum times a per-register
        # byte count: the element size for the ld*r forms, otherwise 8 or
        # 16 depending on the arrangement.
        if self._name in ["ld1r", "ld2r", "ld3r", "ld4r"]:
            unit = {"8B" : 1, "16B" : 1, "4H" : 2, "8H" : 2,
                    "2S" : 4, "4S" : 4, "1D" : 8, "2D" : 8}[self.arrangement]
        elif self.arrangement in ["8B", "4H", "2S", "1D"]:
            unit = 8
        else:
            unit = 16
        self.address.offset = self.regnum * unit
        return self

    def _simdRegs(self):
        """Return the ``regnum`` registers starting at the first one.

        Each following register comes from ``nextReg()`` on its predecessor.
        """
        reg = self._firstSIMDreg
        regs = [reg]
        for _ in range(1, self.regnum):
            reg = reg.nextReg()
            regs.append(reg)
        return regs

    def cstr(self):
        """Return the C++ call: registers, arrangement, then the address."""
        head = super(LdStNEONOp, self).cstr()
        regList = ", ".join(str(reg) for reg in self._simdRegs())
        return '%s%s, __ T%s, %s);' % (head, regList, self.arrangement,
                                       str(self.address))

    def astr(self):
        """Return the assembly text: ``name {v.arr, ...}, address``."""
        regList = ", ".join('%s.%s' % (reg, self.arrangement)
                            for reg in self._simdRegs())
        return '%s\t{%s}, %s' % (self._name, regList, self.address.astr("x"))

    def aname(self):
        return self._name
|
|
|
|
class NEONReduceInstruction(Instruction):
    """NEON instruction with one destination and one vector source.

    ``args`` is ``[name, insname, arrangement]``: the C++ method name, the
    assembly mnemonic and the source arrangement.
    """

    def __init__(self, args):
        self._name, self.insname, self.arrangement = args

    def generate(self):
        """Pick a destination register; the source is the one after it."""
        self.dstSIMDreg = FloatRegister().generate()
        self.srcSIMDreg = self.dstSIMDreg.nextReg()
        return self

    def cstr(self):
        """Return the C++ call; fmaxp/fminp take their arguments differently."""
        head = Instruction.cstr(self) + str(self.dstSIMDreg)
        if self._name in ("fmaxp", "fminp"):
            # Source comes first, followed by the arrangement minus its
            # leading character.
            return '%s, %s, __ %s);' % (head, self.srcSIMDreg,
                                        self.arrangement[1:])
        return '%s, __ T%s, %s);' % (head, self.arrangement, self.srcSIMDreg)

    def astr(self):
        """Return the assembly text.

        The destination is rendered with the lower-cased last character of
        the arrangement; the source is rendered as ``<reg>.<arrangement>``.
        """
        dst = self.dstSIMDreg.astr(self.arrangement[-1].lower())
        return '%s\t%s, %s.%s' % (self.insname, dst, self.srcSIMDreg,
                                  self.arrangement)

    def aname(self):
        return self._name
|
|
|
|
class CommonNEONInstruction(Instruction):
    """NEON instruction whose operands are consecutive SIMD registers.

    ``args`` is ``[name, insname, arrangement]``. The operand count comes
    from ``self.numRegs``, which this class does not define itself.
    """

    def __init__(self, args):
        self._name, self.insname, self.arrangement = args

    def generate(self):
        self._firstSIMDreg = FloatRegister().generate()
        return self

    def _simdRegs(self):
        """Return ``numRegs`` registers, each the ``nextReg()`` of the last."""
        reg = self._firstSIMDreg
        regs = [reg]
        for _ in range(1, self.numRegs):
            reg = reg.nextReg()
            regs.append(reg)
        return regs

    def cstr(self):
        """Return the C++ call: first register, arrangement, the rest."""
        regs = self._simdRegs()
        operands = [str(regs[0]), '__ T%s' % self.arrangement]
        operands.extend(str(reg) for reg in regs[1:])
        return Instruction.cstr(self) + ", ".join(operands) + ");"

    def astr(self):
        """Return the assembly text with every register as ``reg.arr``."""
        operands = ", ".join('%s.%s' % (reg, self.arrangement)
                             for reg in self._simdRegs())
        return '%s\t%s' % (self.insname, operands)

    def aname(self):
        return self._name
|
|
|
|
class SHA512SIMDOp(Instruction):
    """SHA-512 SIMD instruction: two registers for sha512su0, else three."""

    def generate(self):
        count = 2 if self._name == 'sha512su0' else 3
        self.reg = [FloatRegister().generate() for _ in range(count)]
        return self

    def cstr(self):
        """Return the C++ call; T2D follows the first register."""
        lastIndex = 2 if self._name == 'sha512su0' else 3
        operands = [str(self.reg[0]), "__ T2D"]
        operands.extend(str(self.reg[idx]) for idx in range(1, lastIndex))
        return super(SHA512SIMDOp, self).cstr() + ", ".join(operands) + ");"

    def astr(self):
        """Return the assembly text.

        sha512su0 and sha512su1 render every register as ``v<n>.2D``; any
        other name renders the first two via ``astr("q")`` and only the
        last as ``v<n>.2D``.
        """
        mnemonic = super(SHA512SIMDOp, self).astr()
        if self._name == 'sha512su0':
            operands = ['%s.2D' % self.reg[idx].astr("v") for idx in (0, 1)]
        elif self._name == 'sha512su1':
            operands = ['%s.2D' % self.reg[idx].astr("v")
                        for idx in (0, 1, 2)]
        else:
            operands = [self.reg[0].astr("q"),
                        self.reg[1].astr("q"),
                        '%s.2D' % self.reg[2].astr("v")]
        return mnemonic + '\t' + ", ".join(operands)
|
|
|
|
class SHA3SIMDOp(Instruction):
    """SHA-3 SIMD instruction.

    eor3 and bcax use four registers. Every other name uses three, and xar
    additionally gets a random immediate in the range 0..63.
    """

    def generate(self):
        count = 4 if self._name in ('eor3', 'bcax') else 3
        self.reg = [FloatRegister().generate() for _ in range(count)]
        if self._name == 'xar':
            self.imm6 = random.randint(0, 63)
        return self

    def cstr(self):
        """Return the C++ call; the arrangement follows the first register."""
        if self._name in ('eor3', 'bcax'):
            operands = [self.reg[0], "__ T16B",
                        self.reg[1], self.reg[2], self.reg[3]]
        elif self._name == 'rax1':
            operands = [self.reg[0], "__ T2D", self.reg[1], self.reg[2]]
        else:
            operands = [self.reg[0], "__ T2D",
                        self.reg[1], self.reg[2], self.imm6]
        return (super(SHA3SIMDOp, self).cstr()
                + ", ".join(str(operand) for operand in operands) + ");")

    def astr(self):
        """Return the assembly text; the fallback form appends ``#imm6``."""
        mnemonic = super(SHA3SIMDOp, self).astr()
        if self._name in ('eor3', 'bcax'):
            operands = ['%s.16B' % self.reg[idx].astr("v")
                        for idx in (0, 1, 2, 3)]
        else:
            operands = ['%s.2D' % self.reg[idx].astr("v")
                        for idx in (0, 1, 2)]
            if self._name != 'rax1':
                operands.append('#%s' % self.imm6)
        return mnemonic + '\t' + ", ".join(operands)
|
|
|
|
class LSEOp(Instruction):
    """Instruction with source, target and address registers.

    ``args`` is ``[name, asmname, size, suffix]``. ``size`` is "x" or "w";
    ``suffix`` is appended to both names when generate() runs.
    """

    def __init__(self, args):
        self._name, self.asmname, self.size, self.suffix = args

    def generate(self):
        """Apply the suffix to both names and pick the three registers.

        Each call appends the suffix again, so call this once per instance.
        """
        self._name = "%s%s" % (self._name, self.suffix)
        self.asmname = "%s%s" % (self.asmname, self.suffix)
        self.srcReg = GeneralRegisterOrZr().generate()
        self.tgtReg = GeneralRegisterOrZr().generate()
        self.adrReg = GeneralRegisterOrSp().generate()
        return self

    def cstr(self):
        """Return the C++ call: operand size, source, target, address."""
        sizeSpec = {"x" : "Assembler::xword", "w" : "Assembler::word"}[self.size]
        operands = [sizeSpec, str(self.srcReg), str(self.tgtReg),
                    str(self.adrReg)]
        return super(LSEOp, self).cstr() + ", ".join(operands) + ");"

    def astr(self):
        """Return the assembly text; the address always uses "x"."""
        source = self.srcReg.astr(self.size)
        target = self.tgtReg.astr(self.size)
        return "%s\t%s, %s, [%s]" % (self.asmname, source, target,
                                     self.adrReg.astr("x"))

    def aname(self):
        return self.asmname
|
|
|
|
class TwoRegFloatOp(FloatInstruction):
    """FloatInstruction with ``numRegs`` fixed at 2."""

    numRegs = 2
|
|
|
|
class ThreeRegFloatOp(TwoRegFloatOp):
    """TwoRegFloatOp variant with ``numRegs`` set to 3."""

    numRegs = 3
|
|
|
|
class FourRegFloatOp(TwoRegFloatOp):
    """TwoRegFloatOp variant with ``numRegs`` set to 4."""

    numRegs = 4
|
|
|
|
class FloatConvertOp(TwoRegFloatOp):
    """Two-register float op with separate C++ and assembly names.

    ``args`` is ``[cname, aname, modes]``; ``[cname, modes]`` is forwarded
    to ``TwoRegFloatOp.__init__``.
    """

    def __init__(self, args):
        cname, aname, modes = args
        self._cname = cname
        self._aname = aname
        TwoRegFloatOp.__init__(self, [cname, modes])

    def aname(self):
        return self._aname

    def cname(self):
        return self._cname
|
|
|
|
class TwoRegNEONOp(CommonNEONInstruction):
    """CommonNEONInstruction with ``numRegs`` fixed at 2."""

    numRegs = 2
|
|
|
|
class ThreeRegNEONOp(TwoRegNEONOp):
    """TwoRegNEONOp variant with ``numRegs`` set to 3."""

    numRegs = 3
|
|
|
|
class SpecialCases(Instruction):
    """Hand-written case: ``data`` is ``[name, C++ text, assembly text]``.

    Both texts are returned verbatim by cstr() and astr().
    """

    def __init__(self, data):
        self._name, self._cstr, self._astr = data[0], data[1], data[2]

    def cstr(self):
        return self._cstr

    def astr(self):
        return self._astr
|
|
|
|
def generate(kind, names):
    """Emit one test case per entry of ``names`` for instruction class ``kind``.

    For each entry, ``kind(entry).generate()`` builds the instruction. Its
    C++ text, with the assembly text as a trailing comment, is printed to
    stdout, and the assembly text alone is written to the module-level
    ``outfile``. When ``multipleForms()`` is non-zero, one line is emitted
    per form by %-substituting ``forms()[i]`` and ``aforms()[i]`` into the
    C++ and assembly texts.

    ``print`` is called with a single parenthesised argument so the output
    is the same whether this runs as a Python 2 statement or a Python 3
    function call.
    """
    outfile.write("# " + kind.__name__ + "\n")
    print("\n// " + kind.__name__)
    for name in names:
        op = kind(name).generate()
        if op.multipleForms():
            forms = op.forms()
            aforms = op.aforms()
            for formIndex in range(op.multipleForms()):
                cstr = op.cstr() % forms[formIndex]
                astr = op.astr() % aforms[formIndex]
                print(" %-50s //\t%s" % (cstr, astr))
                outfile.write("\t" + astr + "\n")
        else:
            print(" %-50s //\t%s" % (op.cstr(), op.astr()))
            outfile.write("\t" + op.astr() + "\n")
|
|
|
|
# The assembly text of every generated instruction is written to this file.
outfile = open("aarch64ops.s", "w")

# Seed the generator with a fixed value so that re-running the script picks
# the same operands, keeping changes to the assembler test code to a minimum.
random.seed(0)

# Single-argument print(...) produces the same output under Python 2 and 3.
print("// BEGIN Generated code -- do not edit")
print("// Generated by aarch64-asmtest.py")

print(" Label back, forth;")
print(" __ bind(back);")

outfile.write("back:\n")
|
|
|
|
# Integer arithmetic/logical, branch, move, bitfield, system and
# single-register instructions.
generate(ArithOp,
         ["add", "sub", "adds", "subs",
          "addw", "subw", "addsw", "subsw",
          "and", "orr", "eor", "ands",
          "andw", "orrw", "eorw", "andsw",
          "bic", "orn", "eon", "bics",
          "bicw", "ornw", "eonw", "bicsw"])

generate(AddSubImmOp,
         ["addw", "addsw", "subw", "subsw",
          "add", "adds", "sub", "subs"])
generate(LogicalImmOp,
         ["andw", "orrw", "eorw", "andsw",
          "and", "orr", "eor", "ands"])

generate(AbsOp, ["b", "bl"])

generate(RegAndAbsOp, ["cbzw", "cbnzw", "cbz", "cbnz", "adr", "adrp"])

generate(RegImmAbsOp, ["tbz", "tbnz"])

generate(MoveWideImmOp, ["movnw", "movzw", "movkw", "movn", "movz", "movk"])

# NOTE(review): "sbfm" is listed twice and "sbfmw" never; the first entry
# may have been meant as "sbfmw". Confirm before changing, because it
# alters the generated test.
generate(BitfieldOp, ["sbfm", "bfmw", "ubfmw", "sbfm", "bfm", "ubfm"])

generate(ExtractOp, ["extrw", "extr"])

generate(CondBranchOp,
         ["EQ", "NE", "HS", "CS", "LO", "CC", "MI", "PL", "VS", "VC",
          "HI", "LS", "GE", "LT", "GT", "LE", "AL", "NV"])

generate(ImmOp,
         ["svc", "hvc", "smc", "brk", "hlt",  # "dcps1", "dcps2", "dcps3"
          ])

generate(Op,
         ["nop", "yield", "wfe", "sev", "sevl",
          "autia1716", "autiasp", "autiaz", "autib1716", "autibsp", "autibz",
          "pacia1716", "paciasp", "paciaz", "pacib1716", "pacibsp", "pacibz",
          "eret", "drps", "isb"])

# Ensure the "i" is not stripped off the end of the instruction
generate(PostfixExceptionOp, ["wfi", "xpaclri"])

barriers = ["OSHLD", "OSHST", "OSH", "NSHLD", "NSHST", "NSH",
            "ISHLD", "ISHST", "ISH", "LD", "ST", "SY"]

generate(SystemOp, [["dsb", barriers], ["dmb", barriers]])

generate(OneRegOp,
         ["br", "blr",
          "paciza", "pacizb", "pacdza", "pacdzb",
          "autiza", "autizb", "autdza", "autdzb", "xpacd",
          "braaz", "brabz", "blraaz", "blrabz"])

# Ensure the "i" is not stripped off the end of the instruction
generate(PostfixExceptionOneRegOp, ["xpaci"])
|
|
|
|
# Exclusive and acquire/release accesses for every access size.
for mode in 'xwhb':
    generate(LoadStoreExclusiveOp,
             [["stxr", mode, 3], ["stlxr", mode, 3],
              ["ldxr", mode, 2], ["ldaxr", mode, 2],
              ["stlr", mode, 2], ["ldar", mode, 2]])

# The pair forms are only generated for "x" and "w".
for mode in 'xw':
    generate(LoadStoreExclusiveOp,
             [["ldxp", mode, 3], ["ldaxp", mode, 3],
              ["stxp", mode, 4], ["stlxp", mode, 4]])


def _loadStoreArgs(kind):
    """Return the LoadStoreOp argument lists for address kind ``kind``.

    Each entry is [C++ name, assembly name, kind, size]. The pcrel kind
    only gets the two plain ldr forms.
    """
    if kind == Address.pcrel:
        variants = [("ldr", "ldr", "x"), ("ldr", "ldr", "w")]
    else:
        variants = [("str", "str", "x"), ("str", "str", "w"),
                    ("str", "strb", "b"), ("str", "strh", "h"),
                    ("ldr", "ldr", "x"), ("ldr", "ldr", "w"),
                    ("ldr", "ldrb", "b"), ("ldr", "ldrh", "h"),
                    ("ldrsb", "ldrsb", "x"), ("ldrsh", "ldrsh", "x"),
                    ("ldrsh", "ldrsh", "w"), ("ldrsw", "ldrsw", "x"),
                    ("ldr", "ldr", "d"), ("ldr", "ldr", "s"),
                    ("str", "str", "d"), ("str", "str", "s")]
    return [[cname, aname, kind, size] for cname, aname, size in variants]


for kind in range(6):
    sys.stdout.write("\n// " + Address.kindToStr(kind))
    generate(LoadStoreOp, _loadStoreArgs(kind))

for kind in (Address.base_plus_unscaled_offset, Address.pcrel,
             Address.base_plus_reg, Address.base_plus_scaled_offset):
    generate(LoadStoreOp,
             [["prfm", "prfm\tPLDL1KEEP,", kind, "x"]])
|
|
|
|
# Carry, extended-register, conditional and plain register-register
# instructions.
generate(AddSubCarryOp,
         ["adcw", "adcsw", "sbcw", "sbcsw", "adc", "adcs", "sbc", "sbcs"])

# NOTE(review): the third entry is "sub" although its neighbours are the
# word-sized forms; it may have been meant as "subw". Confirm before
# changing, because it alters the generated test.
generate(AddSubExtendedOp,
         ["addw", "addsw", "sub", "subsw", "add", "adds", "sub", "subs"])

generate(ConditionalCompareOp, ["ccmnw", "ccmpw", "ccmn", "ccmp"])
generate(ConditionalCompareImmedOp, ["ccmnw", "ccmpw", "ccmn", "ccmp"])
generate(ConditionalSelectOp,
         ["cselw", "csincw", "csinvw", "csnegw",
          "csel", "csinc", "csinv", "csneg"])

generate(TwoRegOp,
         ["rbitw", "rev16w", "revw", "clzw", "clsw", "rbit",
          "rev16", "rev32", "rev", "clz", "cls",
          "pacia", "pacib", "pacda", "pacdb",
          "autia", "autib", "autda", "autdb",
          "braa", "brab", "blraa", "blrab"])

generate(ThreeRegOp,
         ["udivw", "sdivw", "lslvw", "lsrvw", "asrvw", "rorvw",
          "udiv", "sdiv", "lslv", "lsrv", "asrv", "rorv",
          "umulh", "smulh"])
generate(FourRegMulOp,
         ["maddw", "msubw", "madd", "msub",
          "smaddl", "smsubl", "umaddl", "umsubl"])
|
|
|
|
# Scalar floating-point instructions. The second item of each entry is the
# mode string handed to the op class, one character per register.
generate(ThreeRegFloatOp,
         [["fabds", "sss"], ["fmuls", "sss"], ["fdivs", "sss"],
          ["fadds", "sss"], ["fsubs", "sss"],
          ["fabdd", "ddd"], ["fmuld", "ddd"], ["fdivd", "ddd"],
          ["faddd", "ddd"], ["fsubd", "ddd"]])

# NOTE(review): "fnmadds" and "fnmaddd" each appear twice; the second of
# each pair may have been meant as the fnmsub form. Confirm the matching
# assembler method names before changing.
generate(FourRegFloatOp,
         [["fmadds", "ssss"], ["fmsubs", "ssss"],
          ["fnmadds", "ssss"], ["fnmadds", "ssss"],
          ["fmaddd", "dddd"], ["fmsubd", "dddd"],
          ["fnmaddd", "dddd"], ["fnmaddd", "dddd"]])

generate(TwoRegFloatOp,
         [["fmovs", "ss"], ["fabss", "ss"], ["fnegs", "ss"],
          ["fsqrts", "ss"], ["fcvts", "ds"],
          ["fmovd", "dd"], ["fabsd", "dd"], ["fnegd", "dd"],
          ["fsqrtd", "dd"], ["fcvtd", "sd"]])

# Entries are [C++ name, assembly name, modes].
generate(FloatConvertOp,
         [["fcvtzsw", "fcvtzs", "ws"], ["fcvtzs", "fcvtzs", "xs"],
          ["fcvtzdw", "fcvtzs", "wd"], ["fcvtzd", "fcvtzs", "xd"],
          ["scvtfws", "scvtf", "sw"], ["scvtfs", "scvtf", "sx"],
          ["scvtfwd", "scvtf", "dw"], ["scvtfd", "scvtf", "dx"],
          ["fcvtassw", "fcvtas", "ws"], ["fcvtasd", "fcvtas", "xd"],
          ["fcvtmssw", "fcvtms", "ws"], ["fcvtmsd", "fcvtms", "xd"],
          ["fmovs", "fmov", "ws"], ["fmovd", "fmov", "xd"],
          ["fmovs", "fmov", "sw"], ["fmovd", "fmov", "dx"]])

generate(TwoRegFloatOp,
         [["fcmps", "ss"], ["fcmpd", "dd"],
          ["fcmps", "sz"], ["fcmpd", "dz"]])
|
|
|
|
# Pair loads/stores for address kinds 0, 1 and 2.
for kind in range(3):
    generate(LoadStorePairOp,
             [["stp", "stp", kind, "w"],
              ["ldp", "ldp", kind, "w"],
              ["ldpsw", "ldpsw", kind, "x"],
              ["stp", "stp", kind, "x"],
              ["ldp", "ldp", kind, "x"]])

# The stnp/ldnp forms are generated once, with address kind 0 only.
generate(LoadStorePairOp,
         [["stnp", "stnp", 0, "w"],
          ["ldnp", "ldnp", 0, "w"],
          ["stnp", "stnp", 0, "x"],
          ["ldnp", "ldnp", 0, "x"]])
|
|
|
|
# NEON structure loads. Entries are
# [name, register count, arrangement, address kind].
generate(LdStNEONOp,
         [["ld1", 1, "8B", Address.base_only],
          ["ld1", 2, "16B", Address.post],
          ["ld1", 3, "1D", Address.post_reg],
          ["ld1", 4, "8H", Address.post],
          ["ld1r", 1, "8B", Address.base_only],
          ["ld1r", 1, "4S", Address.post],
          ["ld1r", 1, "1D", Address.post_reg],
          ["ld2", 2, "2D", Address.base_only],
          ["ld2", 2, "4H", Address.post],
          ["ld2r", 2, "16B", Address.base_only],
          ["ld2r", 2, "2S", Address.post],
          ["ld2r", 2, "2D", Address.post_reg],
          ["ld3", 3, "4S", Address.post_reg],
          ["ld3", 3, "2S", Address.base_only],
          ["ld3r", 3, "8H", Address.base_only],
          ["ld3r", 3, "4S", Address.post],
          ["ld3r", 3, "1D", Address.post_reg],
          ["ld4", 4, "8H", Address.post],
          ["ld4", 4, "8B", Address.post_reg],
          ["ld4r", 4, "8B", Address.base_only],
          ["ld4r", 4, "4H", Address.post],
          ["ld4r", 4, "2S", Address.post_reg],
          ])
|
|
|
|
# Arrangement groups used by the NEON tables below. The order inside each
# group is the order in which the test cases are generated.
_NEON_B = ["8B", "16B"]
_NEON_HS = ["4H", "8H", "2S", "4S"]
_NEON_BHS = _NEON_B + _NEON_HS
_NEON_BHSD = _NEON_BHS + ["2D"]
_NEON_FP = ["2S", "4S", "2D"]
_NEON_ACROSS = ["8B", "16B", "4H", "8H", "4S"]


def _neonOps(spec):
    """Expand (cname, aname, arrangements) triples, keeping their order.

    Returns one ``[cname, aname, arrangement]`` list per arrangement.
    """
    return [[cname, aname, arrangement]
            for cname, aname, arrangements in spec
            for arrangement in arrangements]


def _neonInterleaved(names, arrangements):
    """Return ``[name, name, arrangement]`` lists, arrangement-major.

    For each arrangement in turn, every name is listed once.
    """
    return [[name, name, arrangement]
            for arrangement in arrangements
            for name in names]


generate(NEONReduceInstruction,
         _neonOps([("addv", "addv", _NEON_ACROSS),
                   ("smaxv", "smaxv", _NEON_ACROSS),
                   ("fmaxv", "fmaxv", ["4S"])])
         # sminv and uminv alternate within each arrangement.
         + _neonInterleaved(["sminv", "uminv"], _NEON_ACROSS)
         + _neonOps([("fminv", "fminv", ["4S"]),
                     ("fmaxp", "fmaxp", ["2S", "2D"]),
                     ("fminp", "fminp", ["2S", "2D"])]))

generate(TwoRegNEONOp,
         _neonOps([("absr", "abs", _NEON_BHSD),
                   ("fabs", "fabs", _NEON_FP),
                   ("fneg", "fneg", _NEON_FP),
                   ("fsqrt", "fsqrt", _NEON_FP),
                   ("notr", "not", _NEON_B)]))

generate(ThreeRegNEONOp,
         _neonOps([("andr", "and", _NEON_B),
                   ("orr", "orr", _NEON_B),
                   ("eor", "eor", _NEON_B),
                   ("addv", "add", _NEON_BHSD),
                   ("fadd", "fadd", _NEON_FP),
                   ("subv", "sub", _NEON_BHSD),
                   ("fsub", "fsub", _NEON_FP),
                   ("mulv", "mul", _NEON_BHS),
                   ("fabd", "fabd", _NEON_FP),
                   ("fmul", "fmul", _NEON_FP),
                   ("mlav", "mla", _NEON_HS),
                   ("fmla", "fmla", _NEON_FP),
                   ("mlsv", "mls", _NEON_HS),
                   ("fmls", "fmls", _NEON_FP),
                   ("fdiv", "fdiv", _NEON_FP),
                   ("maxv", "smax", _NEON_BHS),
                   ("smaxp", "smaxp", _NEON_BHS),
                   ("fmax", "fmax", _NEON_FP),
                   ("minv", "smin", _NEON_BHS),
                   ("sminp", "sminp", _NEON_BHS),
                   ("fmin", "fmin", _NEON_FP),
                   ("cmeq", "cmeq", _NEON_BHSD),
                   ("fcmeq", "fcmeq", _NEON_FP),
                   ("cmgt", "cmgt", _NEON_BHSD),
                   ("cmhi", "cmhi", _NEON_BHSD),
                   ("cmhs", "cmhs", _NEON_BHSD),
                   ("fcmgt", "fcmgt", _NEON_FP),
                   ("cmge", "cmge", _NEON_BHSD),
                   ("fcmge", "fcmge", _NEON_FP),
                   ]))

generate(SVEComparisonWithZero, ["EQ", "GT", "GE", "LT", "LE", "NE"])
|
|
|
|
generate(SpecialCases, [["ccmn", "__ ccmn(zr, zr, 3u, Assembler::LE);", "ccmn\txzr, xzr, #3, LE"],
|
|
["ccmnw", "__ ccmnw(zr, zr, 5u, Assembler::EQ);", "ccmn\twzr, wzr, #5, EQ"],
|
|
["ccmp", "__ ccmp(zr, 1, 4u, Assembler::NE);", "ccmp\txzr, 1, #4, NE"],
|
|
["ccmpw", "__ ccmpw(zr, 2, 2, Assembler::GT);", "ccmp\twzr, 2, #2, GT"],
|
|
["extr", "__ extr(zr, zr, zr, 0);", "extr\txzr, xzr, xzr, 0"],
|
|
["stlxp", "__ stlxp(r0, zr, zr, sp);", "stlxp\tw0, xzr, xzr, [sp]"],
|
|
["stlxpw", "__ stlxpw(r2, zr, zr, r3);", "stlxp\tw2, wzr, wzr, [x3]"],
|
|
["stxp", "__ stxp(r4, zr, zr, r5);", "stxp\tw4, xzr, xzr, [x5]"],
|
|
["stxpw", "__ stxpw(r6, zr, zr, sp);", "stxp\tw6, wzr, wzr, [sp]"],
|
|
["dup", "__ dup(v0, __ T16B, zr);", "dup\tv0.16b, wzr"],
|
|
["dup", "__ dup(v0, __ S, v1);", "dup\ts0, v1.s[0]"],
|
|
["mov", "__ mov(v1, __ D, 0, zr);", "mov\tv1.d[0], xzr"],
|
|
["mov", "__ mov(v1, __ S, 1, zr);", "mov\tv1.s[1], wzr"],
|
|
["mov", "__ mov(v1, __ H, 2, zr);", "mov\tv1.h[2], wzr"],
|
|
["mov", "__ mov(v1, __ B, 3, zr);", "mov\tv1.b[3], wzr"],
|
|
["smov", "__ smov(r0, v1, __ S, 0);", "smov\tx0, v1.s[0]"],
|
|
["smov", "__ smov(r0, v1, __ H, 1);", "smov\tx0, v1.h[1]"],
|
|
["smov", "__ smov(r0, v1, __ B, 2);", "smov\tx0, v1.b[2]"],
|
|
["umov", "__ umov(r0, v1, __ D, 0);", "umov\tx0, v1.d[0]"],
|
|
["umov", "__ umov(r0, v1, __ S, 1);", "umov\tw0, v1.s[1]"],
|
|
["umov", "__ umov(r0, v1, __ H, 2);", "umov\tw0, v1.h[2]"],
|
|
["umov", "__ umov(r0, v1, __ B, 3);", "umov\tw0, v1.b[3]"],
|
|
["fmov", "__ fmovhid(r0, v1);", "fmov\tx0, v1.d[1]"],
|
|
["fmov", "__ fmovs(v9, __ T2S, 0.5f);", "fmov\tv9.2s, 0.5"],
|
|
["fmov", "__ fmovd(v14, __ T2D, 0.5f);", "fmov\tv14.2d, 0.5"],
|
|
["ld1", "__ ld1(v31, v0, __ T2D, Address(__ post(r1, r0)));", "ld1\t{v31.2d, v0.2d}, [x1], x0"],
|
|
["fcvtzs", "__ fcvtzs(v0, __ T2S, v1);", "fcvtzs\tv0.2s, v1.2s"],
|
|
["fcvtas", "__ fcvtas(v2, __ T4S, v3);", "fcvtas\tv2.4s, v3.4s"],
|
|
["fcvtms", "__ fcvtms(v4, __ T2D, v5);", "fcvtms\tv4.2d, v5.2d"],
|
|
# SVE instructions
|
|
["cpy", "__ sve_cpy(z0, __ S, p0, v1);", "mov\tz0.s, p0/m, s1"],
|
|
["cpy", "__ sve_cpy(z0, __ B, p0, 127, true);", "mov\tz0.b, p0/m, 127"],
|
|
["cpy", "__ sve_cpy(z1, __ H, p0, -128, true);", "mov\tz1.h, p0/m, -128"],
|
|
["cpy", "__ sve_cpy(z2, __ S, p0, 32512, true);", "mov\tz2.s, p0/m, 32512"],
|
|
["cpy", "__ sve_cpy(z5, __ D, p0, -32768, false);", "mov\tz5.d, p0/z, -32768"],
|
|
["cpy", "__ sve_cpy(z10, __ B, p0, -1, false);", "mov\tz10.b, p0/z, -1"],
|
|
["cpy", "__ sve_cpy(z11, __ S, p0, -1, false);", "mov\tz11.s, p0/z, -1"],
|
|
["inc", "__ sve_inc(r0, __ S);", "incw\tx0"],
|
|
["dec", "__ sve_dec(r1, __ H);", "dech\tx1"],
|
|
["lsl", "__ sve_lsl(z0, __ B, z1, 7);", "lsl\tz0.b, z1.b, #7"],
|
|
["lsl", "__ sve_lsl(z21, __ H, z1, 15);", "lsl\tz21.h, z1.h, #15"],
|
|
["lsl", "__ sve_lsl(z0, __ S, z1, 31);", "lsl\tz0.s, z1.s, #31"],
|
|
["lsl", "__ sve_lsl(z0, __ D, z1, 63);", "lsl\tz0.d, z1.d, #63"],
|
|
["lsr", "__ sve_lsr(z0, __ B, z1, 7);", "lsr\tz0.b, z1.b, #7"],
|
|
["asr", "__ sve_asr(z0, __ H, z11, 15);", "asr\tz0.h, z11.h, #15"],
|
|
["lsr", "__ sve_lsr(z30, __ S, z1, 31);", "lsr\tz30.s, z1.s, #31"],
|
|
["asr", "__ sve_asr(z0, __ D, z1, 63);", "asr\tz0.d, z1.d, #63"],
|
|
["lsl", "__ sve_lsl(z0, __ B, p0, 0);", "lsl\tz0.b, p0/m, z0.b, #0"],
|
|
["lsl", "__ sve_lsl(z0, __ B, p0, 5);", "lsl\tz0.b, p0/m, z0.b, #5"],
|
|
["lsl", "__ sve_lsl(z1, __ H, p1, 15);", "lsl\tz1.h, p1/m, z1.h, #15"],
|
|
["lsl", "__ sve_lsl(z2, __ S, p2, 31);", "lsl\tz2.s, p2/m, z2.s, #31"],
|
|
["lsl", "__ sve_lsl(z3, __ D, p3, 63);", "lsl\tz3.d, p3/m, z3.d, #63"],
|
|
["lsr", "__ sve_lsr(z0, __ B, p0, 1);", "lsr\tz0.b, p0/m, z0.b, #1"],
|
|
["lsr", "__ sve_lsr(z0, __ B, p0, 8);", "lsr\tz0.b, p0/m, z0.b, #8"],
|
|
["lsr", "__ sve_lsr(z1, __ H, p1, 15);", "lsr\tz1.h, p1/m, z1.h, #15"],
|
|
["lsr", "__ sve_lsr(z2, __ S, p2, 7);", "lsr\tz2.s, p2/m, z2.s, #7"],
|
|
["lsr", "__ sve_lsr(z2, __ S, p2, 31);", "lsr\tz2.s, p2/m, z2.s, #31"],
|
|
["lsr", "__ sve_lsr(z3, __ D, p3, 63);", "lsr\tz3.d, p3/m, z3.d, #63"],
|
|
["asr", "__ sve_asr(z0, __ B, p0, 1);", "asr\tz0.b, p0/m, z0.b, #1"],
|
|
["asr", "__ sve_asr(z0, __ B, p0, 7);", "asr\tz0.b, p0/m, z0.b, #7"],
|
|
["asr", "__ sve_asr(z1, __ H, p1, 5);", "asr\tz1.h, p1/m, z1.h, #5"],
|
|
["asr", "__ sve_asr(z1, __ H, p1, 15);", "asr\tz1.h, p1/m, z1.h, #15"],
|
|
["asr", "__ sve_asr(z2, __ S, p2, 31);", "asr\tz2.s, p2/m, z2.s, #31"],
|
|
["asr", "__ sve_asr(z3, __ D, p3, 63);", "asr\tz3.d, p3/m, z3.d, #63"],
|
|
["addvl", "__ sve_addvl(sp, r0, 31);", "addvl\tsp, x0, #31"],
|
|
["addpl", "__ sve_addpl(r1, sp, -32);", "addpl\tx1, sp, -32"],
|
|
["cntp", "__ sve_cntp(r8, __ B, p0, p1);", "cntp\tx8, p0, p1.b"],
|
|
["dup", "__ sve_dup(z0, __ B, 127);", "dup\tz0.b, 127"],
|
|
["dup", "__ sve_dup(z1, __ H, -128);", "dup\tz1.h, -128"],
|
|
["dup", "__ sve_dup(z2, __ S, 32512);", "dup\tz2.s, 32512"],
|
|
["dup", "__ sve_dup(z7, __ D, -32768);", "dup\tz7.d, -32768"],
|
|
["dup", "__ sve_dup(z10, __ B, -1);", "dup\tz10.b, -1"],
|
|
["dup", "__ sve_dup(z11, __ S, -1);", "dup\tz11.s, -1"],
|
|
["ld1b", "__ sve_ld1b(z0, __ B, p0, Address(sp));", "ld1b\t{z0.b}, p0/z, [sp]"],
|
|
["ld1b", "__ sve_ld1b(z0, __ H, p1, Address(sp));", "ld1b\t{z0.h}, p1/z, [sp]"],
|
|
["ld1b", "__ sve_ld1b(z0, __ S, p2, Address(sp, r8));", "ld1b\t{z0.s}, p2/z, [sp, x8]"],
|
|
["ld1b", "__ sve_ld1b(z0, __ D, p3, Address(sp, 7));", "ld1b\t{z0.d}, p3/z, [sp, #7, MUL VL]"],
|
|
["ld1h", "__ sve_ld1h(z10, __ H, p1, Address(sp, -8));", "ld1h\t{z10.h}, p1/z, [sp, #-8, MUL VL]"],
|
|
["ld1w", "__ sve_ld1w(z20, __ S, p2, Address(r0, 7));", "ld1w\t{z20.s}, p2/z, [x0, #7, MUL VL]"],
|
|
["ld1b", "__ sve_ld1b(z30, __ B, p3, Address(sp, r8));", "ld1b\t{z30.b}, p3/z, [sp, x8]"],
|
|
["ld1w", "__ sve_ld1w(z0, __ S, p4, Address(sp, r28));", "ld1w\t{z0.s}, p4/z, [sp, x28, LSL #2]"],
|
|
["ld1d", "__ sve_ld1d(z11, __ D, p5, Address(r0, r1));", "ld1d\t{z11.d}, p5/z, [x0, x1, LSL #3]"],
|
|
["st1b", "__ sve_st1b(z22, __ B, p6, Address(sp));", "st1b\t{z22.b}, p6, [sp]"],
|
|
["st1b", "__ sve_st1b(z31, __ B, p7, Address(sp, -8));", "st1b\t{z31.b}, p7, [sp, #-8, MUL VL]"],
|
|
["st1b", "__ sve_st1b(z0, __ H, p1, Address(sp));", "st1b\t{z0.h}, p1, [sp]"],
|
|
["st1b", "__ sve_st1b(z0, __ S, p2, Address(sp, r8));", "st1b\t{z0.s}, p2, [sp, x8]"],
|
|
["st1b", "__ sve_st1b(z0, __ D, p3, Address(sp));", "st1b\t{z0.d}, p3, [sp]"],
|
|
["st1w", "__ sve_st1w(z0, __ S, p1, Address(r0, 7));", "st1w\t{z0.s}, p1, [x0, #7, MUL VL]"],
|
|
["st1b", "__ sve_st1b(z0, __ B, p2, Address(sp, r1));", "st1b\t{z0.b}, p2, [sp, x1]"],
|
|
["st1h", "__ sve_st1h(z0, __ H, p3, Address(sp, r8));", "st1h\t{z0.h}, p3, [sp, x8, LSL #1]"],
|
|
["st1d", "__ sve_st1d(z0, __ D, p4, Address(r0, r17));", "st1d\t{z0.d}, p4, [x0, x17, LSL #3]"],
|
|
["ldr", "__ sve_ldr(z0, Address(sp));", "ldr\tz0, [sp]"],
|
|
["ldr", "__ sve_ldr(z31, Address(sp, -256));", "ldr\tz31, [sp, #-256, MUL VL]"],
|
|
["str", "__ sve_str(z8, Address(r8, 255));", "str\tz8, [x8, #255, MUL VL]"],
|
|
["cntb", "__ sve_cntb(r9);", "cntb\tx9"],
|
|
["cnth", "__ sve_cnth(r10);", "cnth\tx10"],
|
|
["cntw", "__ sve_cntw(r11);", "cntw\tx11"],
|
|
["cntd", "__ sve_cntd(r12);", "cntd\tx12"],
|
|
["brka", "__ sve_brka(p2, p0, p2, false);", "brka\tp2.b, p0/z, p2.b"],
|
|
["brka", "__ sve_brka(p1, p2, p3, true);", "brka\tp1.b, p2/m, p3.b"],
|
|
["brkb", "__ sve_brkb(p1, p2, p3, false);", "brkb\tp1.b, p2/z, p3.b"],
|
|
["brkb", "__ sve_brkb(p2, p3, p4, true);", "brkb\tp2.b, p3/m, p4.b"],
|
|
["rev", "__ sve_rev(p0, __ B, p1);", "rev\tp0.b, p1.b"],
|
|
["rev", "__ sve_rev(p1, __ H, p2);", "rev\tp1.h, p2.h"],
|
|
["rev", "__ sve_rev(p2, __ S, p3);", "rev\tp2.s, p3.s"],
|
|
["rev", "__ sve_rev(p3, __ D, p4);", "rev\tp3.d, p4.d"],
|
|
["incp", "__ sve_incp(r0, __ B, p2);", "incp\tx0, p2.b"],
|
|
["whilelt", "__ sve_whilelt(p0, __ B, r1, r28);", "whilelt\tp0.b, x1, x28"],
|
|
["whilele", "__ sve_whilele(p2, __ H, r11, r8);", "whilele\tp2.h, x11, x8"],
|
|
["whilelo", "__ sve_whilelo(p3, __ S, r7, r2);", "whilelo\tp3.s, x7, x2"],
|
|
["whilels", "__ sve_whilels(p4, __ D, r17, r10);", "whilels\tp4.d, x17, x10"],
|
|
["whileltw", "__ sve_whileltw(p1, __ B, r1, r28);", "whilelt\tp1.b, w1, w28"],
|
|
["whilelew", "__ sve_whilelew(p2, __ H, r11, r8);", "whilele\tp2.h, w11, w8"],
|
|
["whilelow", "__ sve_whilelow(p3, __ S, r7, r2);", "whilelo\tp3.s, w7, w2"],
|
|
["whilelsw", "__ sve_whilelsw(p4, __ D, r17, r10);", "whilels\tp4.d, w17, w10"],
|
|
["sel", "__ sve_sel(z0, __ B, p0, z1, z2);", "sel\tz0.b, p0, z1.b, z2.b"],
|
|
["sel", "__ sve_sel(z4, __ D, p0, z5, z6);", "sel\tz4.d, p0, z5.d, z6.d"],
|
|
["cmpeq", "__ sve_cmp(Assembler::EQ, p1, __ B, p0, z0, z1);", "cmpeq\tp1.b, p0/z, z0.b, z1.b"],
|
|
["cmpne", "__ sve_cmp(Assembler::NE, p1, __ H, p0, z2, z3);", "cmpne\tp1.h, p0/z, z2.h, z3.h"],
|
|
["cmpge", "__ sve_cmp(Assembler::GE, p1, __ S, p2, z4, z5);", "cmpge\tp1.s, p2/z, z4.s, z5.s"],
|
|
["cmpgt", "__ sve_cmp(Assembler::GT, p1, __ D, p3, z6, z7);", "cmpgt\tp1.d, p3/z, z6.d, z7.d"],
|
|
["cmphi", "__ sve_cmp(Assembler::HI, p1, __ S, p2, z4, z5);", "cmphi\tp1.s, p2/z, z4.s, z5.s"],
|
|
["cmphs", "__ sve_cmp(Assembler::HS, p1, __ D, p3, z6, z7);", "cmphs\tp1.d, p3/z, z6.d, z7.d"],
|
|
["cmpeq", "__ sve_cmp(Assembler::EQ, p1, __ B, p4, z0, 15);", "cmpeq\tp1.b, p4/z, z0.b, #15"],
|
|
["cmpne", "__ sve_cmp(Assembler::NE, p1, __ H, p0, z2, -16);", "cmpne\tp1.h, p0/z, z2.h, #-16"],
|
|
["cmple", "__ sve_cmp(Assembler::LE, p1, __ S, p1, z4, 0);", "cmple\tp1.s, p1/z, z4.s, #0"],
|
|
["cmplt", "__ sve_cmp(Assembler::LT, p1, __ D, p2, z6, -1);", "cmplt\tp1.d, p2/z, z6.d, #-1"],
|
|
["cmpge", "__ sve_cmp(Assembler::GE, p1, __ S, p3, z4, 5);", "cmpge\tp1.s, p3/z, z4.s, #5"],
|
|
["cmpgt", "__ sve_cmp(Assembler::GT, p1, __ B, p4, z6, -2);", "cmpgt\tp1.b, p4/z, z6.b, #-2"],
|
|
["fcmeq", "__ sve_fcm(Assembler::EQ, p1, __ S, p0, z0, z1);", "fcmeq\tp1.s, p0/z, z0.s, z1.s"],
|
|
["fcmne", "__ sve_fcm(Assembler::NE, p1, __ D, p0, z2, z3);", "fcmne\tp1.d, p0/z, z2.d, z3.d"],
|
|
["fcmgt", "__ sve_fcm(Assembler::GT, p1, __ S, p2, z4, z5);", "fcmgt\tp1.s, p2/z, z4.s, z5.s"],
|
|
["fcmge", "__ sve_fcm(Assembler::GE, p1, __ D, p3, z6, z7);", "fcmge\tp1.d, p3/z, z6.d, z7.d"],
|
|
["uunpkhi", "__ sve_uunpkhi(z0, __ H, z1);", "uunpkhi\tz0.h, z1.b"],
|
|
["uunpklo", "__ sve_uunpklo(z4, __ S, z5);", "uunpklo\tz4.s, z5.h"],
|
|
["sunpkhi", "__ sve_sunpkhi(z6, __ D, z7);", "sunpkhi\tz6.d, z7.s"],
|
|
["sunpklo", "__ sve_sunpklo(z10, __ H, z11);", "sunpklo\tz10.h, z11.b"],
|
|
["scvtf", "__ sve_scvtf(z1, __ D, p0, z0, __ S);", "scvtf\tz1.d, p0/m, z0.s"],
|
|
["scvtf", "__ sve_scvtf(z3, __ D, p1, z2, __ D);", "scvtf\tz3.d, p1/m, z2.d"],
|
|
["scvtf", "__ sve_scvtf(z6, __ S, p2, z1, __ D);", "scvtf\tz6.s, p2/m, z1.d"],
|
|
["scvtf", "__ sve_scvtf(z6, __ S, p3, z1, __ S);", "scvtf\tz6.s, p3/m, z1.s"],
|
|
["scvtf", "__ sve_scvtf(z6, __ H, p3, z1, __ S);", "scvtf\tz6.h, p3/m, z1.s"],
|
|
["scvtf", "__ sve_scvtf(z6, __ H, p3, z1, __ D);", "scvtf\tz6.h, p3/m, z1.d"],
|
|
["scvtf", "__ sve_scvtf(z6, __ H, p3, z1, __ H);", "scvtf\tz6.h, p3/m, z1.h"],
|
|
["fcvt", "__ sve_fcvt(z5, __ D, p3, z4, __ S);", "fcvt\tz5.d, p3/m, z4.s"],
|
|
["fcvt", "__ sve_fcvt(z1, __ S, p3, z0, __ D);", "fcvt\tz1.s, p3/m, z0.d"],
|
|
["fcvtzs", "__ sve_fcvtzs(z19, __ D, p2, z1, __ D);", "fcvtzs\tz19.d, p2/m, z1.d"],
|
|
["fcvtzs", "__ sve_fcvtzs(z9, __ S, p1, z8, __ S);", "fcvtzs\tz9.s, p1/m, z8.s"],
|
|
["fcvtzs", "__ sve_fcvtzs(z1, __ S, p2, z0, __ D);", "fcvtzs\tz1.s, p2/m, z0.d"],
|
|
["fcvtzs", "__ sve_fcvtzs(z1, __ D, p3, z0, __ S);", "fcvtzs\tz1.d, p3/m, z0.s"],
|
|
["fcvtzs", "__ sve_fcvtzs(z1, __ S, p4, z18, __ H);", "fcvtzs\tz1.s, p4/m, z18.h"],
|
|
["lasta", "__ sve_lasta(r0, __ B, p0, z15);", "lasta\tw0, p0, z15.b"],
|
|
["lastb", "__ sve_lastb(r1, __ B, p1, z16);", "lastb\tw1, p1, z16.b"],
|
|
["lasta", "__ sve_lasta(v0, __ B, p0, z15);", "lasta\tb0, p0, z15.b"],
|
|
["lastb", "__ sve_lastb(v1, __ B, p1, z16);", "lastb\tb1, p1, z16.b"],
|
|
["index", "__ sve_index(z6, __ S, 1, 1);", "index\tz6.s, #1, #1"],
|
|
["index", "__ sve_index(z6, __ B, r5, 2);", "index\tz6.b, w5, #2"],
|
|
["index", "__ sve_index(z6, __ H, r5, 3);", "index\tz6.h, w5, #3"],
|
|
["index", "__ sve_index(z6, __ S, r5, 4);", "index\tz6.s, w5, #4"],
|
|
["index", "__ sve_index(z7, __ D, r5, 5);", "index\tz7.d, x5, #5"],
|
|
["cpy", "__ sve_cpy(z7, __ H, p3, r5);", "cpy\tz7.h, p3/m, w5"],
|
|
["tbl", "__ sve_tbl(z16, __ S, z17, z18);", "tbl\tz16.s, {z17.s}, z18.s"],
|
|
["ld1w", "__ sve_ld1w_gather(z15, p0, r5, z16);", "ld1w\t{z15.s}, p0/z, [x5, z16.s, uxtw #2]"],
|
|
["ld1d", "__ sve_ld1d_gather(z15, p0, r5, z16);", "ld1d\t{z15.d}, p0/z, [x5, z16.d, uxtw #3]"],
|
|
["st1w", "__ sve_st1w_scatter(z15, p0, r5, z16);", "st1w\t{z15.s}, p0, [x5, z16.s, uxtw #2]"],
|
|
["st1d", "__ sve_st1d_scatter(z15, p0, r5, z16);", "st1d\t{z15.d}, p0, [x5, z16.d, uxtw #3]"],
|
|
["and", "__ sve_and(p0, p1, p2, p3);", "and\tp0.b, p1/z, p2.b, p3.b"],
|
|
["ands", "__ sve_ands(p4, p5, p6, p0);", "ands\tp4.b, p5/z, p6.b, p0.b"],
|
|
["eor", "__ sve_eor(p0, p1, p2, p3);", "eor\tp0.b, p1/z, p2.b, p3.b"],
|
|
["eors", "__ sve_eors(p5, p6, p0, p1);", "eors\tp5.b, p6/z, p0.b, p1.b"],
|
|
["orr", "__ sve_orr(p0, p1, p2, p3);", "orr\tp0.b, p1/z, p2.b, p3.b"],
|
|
["orrs", "__ sve_orrs(p9, p1, p4, p5);", "orrs\tp9.b, p1/z, p4.b, p5.b"],
|
|
["bic", "__ sve_bic(p10, p7, p9, p11);", "bic\tp10.b, p7/z, p9.b, p11.b"],
|
|
["ptest", "__ sve_ptest(p7, p1);", "ptest\tp7, p1.b"],
|
|
["ptrue", "__ sve_ptrue(p1, __ B);", "ptrue\tp1.b"],
|
|
["ptrue", "__ sve_ptrue(p1, __ B, 0b00001);", "ptrue\tp1.b, vl1"],
|
|
["ptrue", "__ sve_ptrue(p1, __ B, 0b00101);", "ptrue\tp1.b, vl5"],
|
|
["ptrue", "__ sve_ptrue(p1, __ B, 0b01001);", "ptrue\tp1.b, vl16"],
|
|
["ptrue", "__ sve_ptrue(p1, __ B, 0b01101);", "ptrue\tp1.b, vl256"],
|
|
["ptrue", "__ sve_ptrue(p2, __ H);", "ptrue\tp2.h"],
|
|
["ptrue", "__ sve_ptrue(p2, __ H, 0b00010);", "ptrue\tp2.h, vl2"],
|
|
["ptrue", "__ sve_ptrue(p2, __ H, 0b00110);", "ptrue\tp2.h, vl6"],
|
|
["ptrue", "__ sve_ptrue(p2, __ H, 0b01010);", "ptrue\tp2.h, vl32"],
|
|
["ptrue", "__ sve_ptrue(p3, __ S);", "ptrue\tp3.s"],
|
|
["ptrue", "__ sve_ptrue(p3, __ S, 0b00011);", "ptrue\tp3.s, vl3"],
|
|
["ptrue", "__ sve_ptrue(p3, __ S, 0b00111);", "ptrue\tp3.s, vl7"],
|
|
["ptrue", "__ sve_ptrue(p3, __ S, 0b01011);", "ptrue\tp3.s, vl64"],
|
|
["ptrue", "__ sve_ptrue(p4, __ D);", "ptrue\tp4.d"],
|
|
["ptrue", "__ sve_ptrue(p4, __ D, 0b00100);", "ptrue\tp4.d, vl4"],
|
|
["ptrue", "__ sve_ptrue(p4, __ D, 0b01000);", "ptrue\tp4.d, vl8"],
|
|
["ptrue", "__ sve_ptrue(p4, __ D, 0b01100);", "ptrue\tp4.d, vl128"],
|
|
["pfalse", "__ sve_pfalse(p7);", "pfalse\tp7.b"],
|
|
["uzp1", "__ sve_uzp1(p0, __ B, p0, p1);", "uzp1\tp0.b, p0.b, p1.b"],
|
|
["uzp1", "__ sve_uzp1(p0, __ H, p0, p1);", "uzp1\tp0.h, p0.h, p1.h"],
|
|
["uzp1", "__ sve_uzp1(p0, __ S, p0, p1);", "uzp1\tp0.s, p0.s, p1.s"],
|
|
["uzp1", "__ sve_uzp1(p0, __ D, p0, p1);", "uzp1\tp0.d, p0.d, p1.d"],
|
|
["uzp2", "__ sve_uzp2(p0, __ B, p0, p1);", "uzp2\tp0.b, p0.b, p1.b"],
|
|
["uzp2", "__ sve_uzp2(p0, __ H, p0, p1);", "uzp2\tp0.h, p0.h, p1.h"],
|
|
["uzp2", "__ sve_uzp2(p0, __ S, p0, p1);", "uzp2\tp0.s, p0.s, p1.s"],
|
|
["uzp2", "__ sve_uzp2(p0, __ D, p0, p1);", "uzp2\tp0.d, p0.d, p1.d"],
|
|
["punpklo", "__ sve_punpklo(p1, p0);", "punpklo\tp1.h, p0.b"],
|
|
["punpkhi", "__ sve_punpkhi(p1, p0);", "punpkhi\tp1.h, p0.b"],
|
|
["compact", "__ sve_compact(z16, __ S, z16, p1);", "compact\tz16.s, p1, z16.s"],
|
|
["compact", "__ sve_compact(z16, __ D, z16, p1);", "compact\tz16.d, p1, z16.d"],
|
|
["ext", "__ sve_ext(z17, z16, 63);", "ext\tz17.b, z17.b, z16.b, #63"],
|
|
# SVE2 instructions
|
|
["histcnt", "__ sve_histcnt(z16, __ S, p0, z16, z16);", "histcnt\tz16.s, p0/z, z16.s, z16.s"],
|
|
["histcnt", "__ sve_histcnt(z17, __ D, p0, z17, z17);", "histcnt\tz17.d, p0/z, z17.d, z17.d"],
|
|
])
|
|
|
|
print "\n// FloatImmediateOp"
|
|
for float in ("2.0", "2.125", "4.0", "4.25", "8.0", "8.5", "16.0", "17.0", "0.125",
|
|
"0.1328125", "0.25", "0.265625", "0.5", "0.53125", "1.0", "1.0625",
|
|
"-2.0", "-2.125", "-4.0", "-4.25", "-8.0", "-8.5", "-16.0", "-17.0",
|
|
"-0.125", "-0.1328125", "-0.25", "-0.265625", "-0.5", "-0.53125", "-1.0", "-1.0625"):
|
|
astr = "fmov d0, #" + float
|
|
cstr = "__ fmovd(v0, " + float + ");"
|
|
print " %-50s //\t%s" % (cstr, astr)
|
|
outfile.write("\t" + astr + "\n")
|
|
|
|
# ARMv8.1A
# Each pair supplies the first two fields of an LSEOp argument list.
# NOTE(review): presumably (assembler-method stem, assembly mnemonic) -- the
# two differ only for ldbic/ldclr and ldorr/ldset; confirm against LSEOp.
lse_name_pairs = (
    ("swp", "swp"),
    ("ldadd", "ldadd"),
    ("ldbic", "ldclr"),
    ("ldeor", "ldeor"),
    ("ldorr", "ldset"),
    ("ldsmin", "ldsmin"),
    ("ldsmax", "ldsmax"),
    ("ldumin", "ldumin"),
    ("ldumax", "ldumax"),
)

# One generate() call per (size, suffix) combination, sizes outermost.
for size in ("x", "w"):
    for suffix in ("", "a", "al", "l"):
        generate(LSEOp, [[first, second, size, suffix]
                         for first, second in lse_name_pairs])
|
|
|
|
# ARMv8.2A
# SHA3 and SHA512 SIMD instructions, generated in this order.
for op_class, mnemonics in (
        (SHA3SIMDOp, ["bcax", "eor3", "rax1", "xar"]),
        (SHA512SIMDOp, ["sha512h", "sha512h2", "sha512su0", "sha512su1"]),
):
    generate(op_class, mnemonics)

# Run the SVE binary-immediate group six times; every round hands generate()
# a freshly built list, exactly as a list literal inside the loop would.
sve_binary_imm_mnemonics = ("add", "sub", "and", "eor", "orr")
for _ in range(6):
    generate(SVEBinaryImmOp, list(sve_binary_imm_mnemonics))
|
|
|
|
def _sve_ops(form, names, *flags):
    """Return one [name, form, flag...] list per name, in the given order."""
    return [[name, form] + list(flags) for name in names]


# Argument lists for SVEVectorOp.  The sequence below is order-sensitive:
# entries are handed to generate() in exactly this order.
# NOTE(review): the form strings ("ZZZ", "ZPZ", "ZPZZ") and the "m" / "dn"
# flags are interpreted by SVEVectorOp, which is defined elsewhere in this
# file; presumably they describe the operand layout, merging predication and
# a destructive destination -- confirm there before relying on that.
sve_vector_ops = (
    _sve_ops("ZZZ", ["add", "sub", "fadd", "fmul", "fsub"])
    + _sve_ops("ZPZ", ["abs"], "m")
    + _sve_ops("ZPZ", ["add", "and", "asr", "bic"], "m", "dn")
    + _sve_ops("ZPZ", ["clz", "cnt"], "m")
    + _sve_ops("ZPZ", ["eor", "lsl", "lsr", "mul"], "m", "dn")
    + _sve_ops("ZPZ", ["neg", "not"], "m")
    + _sve_ops("ZPZ", ["orr"], "m", "dn")
    + _sve_ops("ZPZ", ["rbit", "revb"], "m")
    + _sve_ops("ZPZ", ["smax", "smin", "sub"], "m", "dn")
    + _sve_ops("ZPZ", ["fabs"], "m")
    + _sve_ops("ZPZ", ["fadd", "fdiv", "fmax", "fmin", "fmul"], "m", "dn")
    + _sve_ops("ZPZ", ["fneg", "frintm", "frintn", "frintp", "fsqrt"], "m")
    + _sve_ops("ZPZ", ["fsub"], "m", "dn")
    + _sve_ops("ZPZZ", ["fmad", "fmla", "fmls", "fmsb", "fnmad",
                        "fnmsb", "fnmla", "fnmls", "mla", "mls"], "m")
    + _sve_ops("ZZZ", ["and", "eor", "orr", "bic", "uzp1", "uzp2"])
    # SVE2 instructions
    + _sve_ops("ZZZ", ["bext", "bdep"])
)

generate(SVEVectorOp, sve_vector_ops)
|
|
|
|
# Argument lists for SVEReductionOp, each of the form [mnemonic, number].
# NOTE(review): the number (0 or 2) is consumed by SVEReductionOp, defined
# elsewhere; presumably a lower bound on the element size -- confirm there.
sve_reduction_ops = [[name, 0] for name in ("andv", "orv", "eorv", "smaxv", "sminv")]
sve_reduction_ops += [[name, 2] for name in ("fminv", "fmaxv", "fadda")]
sve_reduction_ops.append(["uaddv", 0])

generate(SVEReductionOp, sve_reduction_ops)
|
|
|
|
print "\n __ bind(forth);"
|
|
outfile.write("forth:\n")
|
|
|
|
outfile.close()
|
|
|
|
# compile for sve with armv9-a+sha3+sve2-bitperm because of SHA3 crypto extension and SVE2 bitperm instructions.
|
|
# armv9-a enables sve and sve2 by default.
|
|
subprocess.check_call([AARCH64_AS, "-march=armv9-a+sha3+sve2-bitperm", "aarch64ops.s", "-o", "aarch64ops.o"])
|
|
|
|
print
|
|
print "/*"
|
|
print "*/"
|
|
|
|
subprocess.check_call([AARCH64_OBJCOPY, "-O", "binary", "-j", ".text", "aarch64ops.o", "aarch64ops.bin"])
|
|
|
|
infile = open("aarch64ops.bin", "r")
|
|
bytes = bytearray(infile.read())
|
|
|
|
print
|
|
print " static const unsigned int insns[] ="
|
|
print " {"
|
|
|
|
i = 0
|
|
while i < len(bytes):
|
|
print " 0x%02x%02x%02x%02x," % (bytes[i+3], bytes[i+2], bytes[i+1], bytes[i]),
|
|
i += 4
|
|
if i%16 == 0:
|
|
print
|
|
print
|
|
print " };"
|
|
print "// END Generated code -- do not edit"
|
|
|
|
infile.close()
|
|
|
|
# Delete the intermediate assembler source, object file and flat binary.
for leftover in ("aarch64ops.s", "aarch64ops.o", "aarch64ops.bin"):
    os.remove(leftover)
|