91117bc546
Tests for correct operation of most x86-64 SSE instructions. It should cover all combinations of overlapping register and memory operands on a set of random-ish data. Results are bit-identical to an Intel i5-8500, with the exception of the RCPSS and RSQRT approximations where the real CPU gives less accurate results (the Intel spec allows relative errors up to 1.5 * 2^-12) Signed-off-by: Paul Brook <paul@nowt.org> Acked-by: Alex Bennée <alex.bennee@linaro.org> Message-Id: <20220424220204.2493824-42-paul@nowt.org> Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
352 lines
9.6 KiB
Python
Executable File
352 lines
9.6 KiB
Python
Executable File
#! /usr/bin/env python3
|
|
|
|
# Generate test-avx.h from x86.csv
|
|
|
|
import csv
|
|
import sys
|
|
from fnmatch import fnmatch
|
|
|
|
archs = [
|
|
# TODO: MMX?
|
|
"SSE", "SSE2", "SSE3", "SSSE3", "SSE4_1", "SSE4_2",
|
|
]
|
|
|
|
ignore = set(["FISTTP",
|
|
"LDMXCSR", "VLDMXCSR", "STMXCSR", "VSTMXCSR"])
|
|
|
|
imask = {
|
|
'vBLENDPD': 0xff,
|
|
'vBLENDPS': 0x0f,
|
|
'CMP[PS][SD]': 0x07,
|
|
'VCMP[PS][SD]': 0x1f,
|
|
'vDPPD': 0x33,
|
|
'vDPPS': 0xff,
|
|
'vEXTRACTPS': 0x03,
|
|
'vINSERTPS': 0xff,
|
|
'MPSADBW': 0x7,
|
|
'VMPSADBW': 0x3f,
|
|
'vPALIGNR': 0x3f,
|
|
'vPBLENDW': 0xff,
|
|
'vPCMP[EI]STR*': 0x0f,
|
|
'vPEXTRB': 0x0f,
|
|
'vPEXTRW': 0x07,
|
|
'vPEXTRD': 0x03,
|
|
'vPEXTRQ': 0x01,
|
|
'vPINSRB': 0x0f,
|
|
'vPINSRW': 0x07,
|
|
'vPINSRD': 0x03,
|
|
'vPINSRQ': 0x01,
|
|
'vPSHUF[DW]': 0xff,
|
|
'vPSHUF[LH]W': 0xff,
|
|
'vPS[LR][AL][WDQ]': 0x3f,
|
|
'vPS[RL]LDQ': 0x1f,
|
|
'vROUND[PS][SD]': 0x7,
|
|
'vSHUFPD': 0x0f,
|
|
'vSHUFPS': 0xff,
|
|
'vAESKEYGENASSIST': 0,
|
|
'VEXTRACT[FI]128': 0x01,
|
|
'VINSERT[FI]128': 0x01,
|
|
'VPBLENDD': 0xff,
|
|
'VPERM2[FI]128': 0x33,
|
|
'VPERMPD': 0xff,
|
|
'VPERMQ': 0xff,
|
|
'VPERMILPS': 0xff,
|
|
'VPERMILPD': 0x0f,
|
|
}
|
|
|
|
def strip_comments(x):
|
|
for l in x:
|
|
if l != '' and l[0] != '#':
|
|
yield l
|
|
|
|
def reg_w(w):
|
|
if w == 8:
|
|
return 'al'
|
|
elif w == 16:
|
|
return 'ax'
|
|
elif w == 32:
|
|
return 'eax'
|
|
elif w == 64:
|
|
return 'rax'
|
|
raise Exception("bad reg_w %d" % w)
|
|
|
|
def mem_w(w):
|
|
if w == 8:
|
|
t = "BYTE"
|
|
elif w == 16:
|
|
t = "WORD"
|
|
elif w == 32:
|
|
t = "DWORD"
|
|
elif w == 64:
|
|
t = "QWORD"
|
|
elif w == 128:
|
|
t = "XMMWORD"
|
|
elif w == 256:
|
|
t = "YMMWORD"
|
|
else:
|
|
raise Exception()
|
|
|
|
return t + " PTR 16[rdx]"
|
|
|
|
class XMMArg():
|
|
isxmm = True
|
|
def __init__(self, reg, mw):
|
|
if mw not in [0, 8, 16, 32, 64, 128, 256]:
|
|
raise Exception("Bad /m width: %s" % w)
|
|
self.reg = reg
|
|
self.mw = mw
|
|
self.ismem = mw != 0
|
|
def regstr(self, n):
|
|
if n < 0:
|
|
return mem_w(self.mw)
|
|
else:
|
|
return "%smm%d" % (self.reg, n)
|
|
|
|
class MMArg():
|
|
isxmm = True
|
|
ismem = False # TODO
|
|
def regstr(self, n):
|
|
return "mm%d" % (n & 7)
|
|
|
|
def match(op, pattern):
|
|
if pattern[0] == 'v':
|
|
return fnmatch(op, pattern[1:]) or fnmatch(op, 'V'+pattern[1:])
|
|
return fnmatch(op, pattern)
|
|
|
|
class ArgVSIB():
|
|
isxmm = True
|
|
ismem = False
|
|
def __init__(self, reg, w):
|
|
if w not in [32, 64]:
|
|
raise Exception("Bad vsib width: %s" % w)
|
|
self.w = w
|
|
self.reg = reg
|
|
def regstr(self, n):
|
|
reg = "%smm%d" % (self.reg, n >> 2)
|
|
return "[rsi + %s * %d]" % (reg, 1 << (n & 3))
|
|
|
|
class ArgImm8u():
|
|
isxmm = False
|
|
ismem = False
|
|
def __init__(self, op):
|
|
for k, v in imask.items():
|
|
if match(op, k):
|
|
self.mask = imask[k];
|
|
return
|
|
raise Exception("Unknown immediate")
|
|
def vals(self):
|
|
mask = self.mask
|
|
yield 0
|
|
n = 0
|
|
while n != mask:
|
|
n += 1
|
|
while (n & ~mask) != 0:
|
|
n += (n & ~mask)
|
|
yield n
|
|
|
|
class ArgRM():
|
|
isxmm = False
|
|
def __init__(self, rw, mw):
|
|
if rw not in [8, 16, 32, 64]:
|
|
raise Exception("Bad r/w width: %s" % w)
|
|
if mw not in [0, 8, 16, 32, 64]:
|
|
raise Exception("Bad r/w width: %s" % w)
|
|
self.rw = rw
|
|
self.mw = mw
|
|
self.ismem = mw != 0
|
|
def regstr(self, n):
|
|
if n < 0:
|
|
return mem_w(self.mw)
|
|
else:
|
|
return reg_w(self.rw)
|
|
|
|
class ArgMem():
|
|
isxmm = False
|
|
ismem = True
|
|
def __init__(self, w):
|
|
if w not in [8, 16, 32, 64, 128, 256]:
|
|
raise Exception("Bad mem width: %s" % w)
|
|
self.w = w
|
|
def regstr(self, n):
|
|
return mem_w(self.w)
|
|
|
|
def ArgGenerator(arg, op):
|
|
if arg[:3] == 'xmm' or arg[:3] == "ymm":
|
|
if "/" in arg:
|
|
r, m = arg.split('/')
|
|
if (m[0] != 'm'):
|
|
raise Exception("Expected /m: %s", arg)
|
|
return XMMArg(arg[0], int(m[1:]));
|
|
else:
|
|
return XMMArg(arg[0], 0);
|
|
elif arg[:2] == 'mm':
|
|
return MMArg();
|
|
elif arg[:4] == 'imm8':
|
|
return ArgImm8u(op);
|
|
elif arg == '<XMM0>':
|
|
return None
|
|
elif arg[0] == 'r':
|
|
if '/m' in arg:
|
|
r, m = arg.split('/')
|
|
if (m[0] != 'm'):
|
|
raise Exception("Expected /m: %s", arg)
|
|
mw = int(m[1:])
|
|
if r == 'r':
|
|
rw = mw
|
|
else:
|
|
rw = int(r[1:])
|
|
return ArgRM(rw, mw)
|
|
|
|
return ArgRM(int(arg[1:]), 0);
|
|
elif arg[0] == 'm':
|
|
return ArgMem(int(arg[1:]))
|
|
elif arg[:2] == 'vm':
|
|
return ArgVSIB(arg[-1], int(arg[2:-1]))
|
|
else:
|
|
raise Exception("Unrecognised arg: %s", arg)
|
|
|
|
class InsnGenerator:
|
|
def __init__(self, op, args):
|
|
self.op = op
|
|
if op[-2:] in ["PS", "PD", "SS", "SD"]:
|
|
if op[-1] == 'S':
|
|
self.optype = 'F32'
|
|
else:
|
|
self.optype = 'F64'
|
|
else:
|
|
self.optype = 'I'
|
|
|
|
try:
|
|
self.args = list(ArgGenerator(a, op) for a in args)
|
|
if len(self.args) > 0 and self.args[-1] is None:
|
|
self.args = self.args[:-1]
|
|
except Exception as e:
|
|
raise Exception("Bad arg %s: %s" % (op, e))
|
|
|
|
def gen(self):
|
|
regs = (10, 11, 12)
|
|
dest = 9
|
|
|
|
nreg = len(self.args)
|
|
if nreg == 0:
|
|
yield self.op
|
|
return
|
|
if isinstance(self.args[-1], ArgImm8u):
|
|
nreg -= 1
|
|
immarg = self.args[-1]
|
|
else:
|
|
immarg = None
|
|
memarg = -1
|
|
for n, arg in enumerate(self.args):
|
|
if arg.ismem:
|
|
memarg = n
|
|
|
|
if (self.op.startswith("VGATHER") or self.op.startswith("VPGATHER")):
|
|
if "GATHERD" in self.op:
|
|
ireg = 13 << 2
|
|
else:
|
|
ireg = 14 << 2
|
|
regset = [
|
|
(dest, ireg | 0, regs[0]),
|
|
(dest, ireg | 1, regs[0]),
|
|
(dest, ireg | 2, regs[0]),
|
|
(dest, ireg | 3, regs[0]),
|
|
]
|
|
if memarg >= 0:
|
|
raise Exception("vsib with memory: %s" % self.op)
|
|
elif nreg == 1:
|
|
regset = [(regs[0],)]
|
|
if memarg == 0:
|
|
regset += [(-1,)]
|
|
elif nreg == 2:
|
|
regset = [
|
|
(regs[0], regs[1]),
|
|
(regs[0], regs[0]),
|
|
]
|
|
if memarg == 0:
|
|
regset += [(-1, regs[0])]
|
|
elif memarg == 1:
|
|
regset += [(dest, -1)]
|
|
elif nreg == 3:
|
|
regset = [
|
|
(dest, regs[0], regs[1]),
|
|
(dest, regs[0], regs[0]),
|
|
(regs[0], regs[0], regs[1]),
|
|
(regs[0], regs[1], regs[0]),
|
|
(regs[0], regs[0], regs[0]),
|
|
]
|
|
if memarg == 2:
|
|
regset += [
|
|
(dest, regs[0], -1),
|
|
(regs[0], regs[0], -1),
|
|
]
|
|
elif memarg > 0:
|
|
raise Exception("Memarg %d" % memarg)
|
|
elif nreg == 4:
|
|
regset = [
|
|
(dest, regs[0], regs[1], regs[2]),
|
|
(dest, regs[0], regs[0], regs[1]),
|
|
(dest, regs[0], regs[1], regs[0]),
|
|
(dest, regs[1], regs[0], regs[0]),
|
|
(dest, regs[0], regs[0], regs[0]),
|
|
(regs[0], regs[0], regs[1], regs[2]),
|
|
(regs[0], regs[1], regs[0], regs[2]),
|
|
(regs[0], regs[1], regs[2], regs[0]),
|
|
(regs[0], regs[0], regs[0], regs[1]),
|
|
(regs[0], regs[0], regs[1], regs[0]),
|
|
(regs[0], regs[1], regs[0], regs[0]),
|
|
(regs[0], regs[0], regs[0], regs[0]),
|
|
]
|
|
if memarg == 2:
|
|
regset += [
|
|
(dest, regs[0], -1, regs[1]),
|
|
(dest, regs[0], -1, regs[0]),
|
|
(regs[0], regs[0], -1, regs[1]),
|
|
(regs[0], regs[1], -1, regs[0]),
|
|
(regs[0], regs[0], -1, regs[0]),
|
|
]
|
|
elif memarg > 0:
|
|
raise Exception("Memarg4 %d" % memarg)
|
|
else:
|
|
raise Exception("Too many regs: %s(%d)" % (self.op, nreg))
|
|
|
|
for regv in regset:
|
|
argstr = []
|
|
for i in range(nreg):
|
|
arg = self.args[i]
|
|
argstr.append(arg.regstr(regv[i]))
|
|
if immarg is None:
|
|
yield self.op + ' ' + ','.join(argstr)
|
|
else:
|
|
for immval in immarg.vals():
|
|
yield self.op + ' ' + ','.join(argstr) + ',' + str(immval)
|
|
|
|
def split0(s):
|
|
if s == '':
|
|
return []
|
|
return s.split(',')
|
|
|
|
def main():
|
|
n = 0
|
|
if len(sys.argv) != 3:
|
|
print("Usage: test-avx.py x86.csv test-avx.h")
|
|
exit(1)
|
|
csvfile = open(sys.argv[1], 'r', newline='')
|
|
with open(sys.argv[2], "w") as outf:
|
|
outf.write("// Generated by test-avx.py. Do not edit.\n")
|
|
for row in csv.reader(strip_comments(csvfile)):
|
|
insn = row[0].replace(',', '').split()
|
|
if insn[0] in ignore:
|
|
continue
|
|
cpuid = row[6]
|
|
if cpuid in archs:
|
|
g = InsnGenerator(insn[0], insn[1:])
|
|
for insn in g.gen():
|
|
outf.write('TEST(%d, "%s", %s)\n' % (n, insn, g.optype))
|
|
n += 1
|
|
outf.write("#undef TEST\n")
|
|
csvfile.close()
|
|
|
|
if __name__ == "__main__":
|
|
main()
|