X86: Implement a "sum of absolute differences" microop.
This commit is contained in:
parent
31d29ee3f8
commit
470dcef229
1 changed files with 19 additions and 0 deletions
|
@ -948,6 +948,25 @@ let {{
|
||||||
FpDestReg.uqw = result;
|
FpDestReg.uqw = result;
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
class Msad(MediaOp):
    # Sum-of-absolute-differences microop. Both source registers are cut
    # into unsigned lanes of srcSize * 8 bits each; the absolute difference
    # of every pair of matching lanes is accumulated, and the total, masked
    # to destSize * 8 bits, is written to the destination register.
    code = '''
        int srcBits = srcSize * 8;
        int items = sizeof(FloatRegBits) / srcSize;

        uint64_t sum = 0;
        for (int i = 0; i < items; i++) {
            int hiIndex = (i + 1) * srcBits - 1;
            int loIndex = (i + 0) * srcBits;
            uint64_t arg1Bits = bits(FpSrcReg1.uqw, hiIndex, loIndex);
            uint64_t arg2Bits = bits(FpSrcReg2.uqw, hiIndex, loIndex);
            // Subtract the smaller lane from the larger one so the
            // difference never passes through a signed type; this stays
            // exact even when a lane is a full 64 bits wide.
            uint64_t resBits = (arg1Bits > arg2Bits) ?
                (arg1Bits - arg2Bits) : (arg2Bits - arg1Bits);
            sum += resBits;
        }
        FpDestReg.uqw = sum & mask(destSize * 8);
    '''
|
||||||
|
|
||||||
class Cvti2f(MediaOp):
|
class Cvti2f(MediaOp):
|
||||||
def __init__(self, dest, src, \
|
def __init__(self, dest, src, \
|
||||||
size = None, destSize = None, srcSize = None, ext = None):
|
size = None, destSize = None, srcSize = None, ext = None):
|
||||||
|
|
Loading…
Reference in a new issue