arch, x86: add support for arrays as memory operands
Although the cache models support wider accesses, the ISA descriptions assume that (for the most part) memory operands are integer types, which makes it difficult to define instructions that do memory accesses larger than 64 bits. This patch adds some generic support for memory operands that are arrays of uint64_t, and specifically a 'u2qw' operand type for x86 that is an array of 2 uint64_ts (128 bits). This support is unused at this point, but will be needed shortly for cmpxchg16b. Ideally the 128-bit SSE memory accesses will also be rewritten to use this support. Support for 128-bit accesses could also have been added using the gcc __int128_t extension, which would have been less disruptive. However, although clang also supports __int128_t, it's still non-standard. Also, more importantly, this approach creates a path to defining 256- and 512-byte operands as well, which will be useful for eventual AVX support.
This commit is contained in:
parent
f5343df1e1
commit
5200e04e92
5 changed files with 112 additions and 8 deletions
|
@ -1053,9 +1053,14 @@ stringRE = re.compile(r'"([^"\\]|\\.)*"')
|
||||||
commentRE = re.compile(r'(^)?[^\S\n]*/(?:\*(.*?)\*/[^\S\n]*|/[^\n]*)($)?',
|
commentRE = re.compile(r'(^)?[^\S\n]*/(?:\*(.*?)\*/[^\S\n]*|/[^\n]*)($)?',
|
||||||
re.DOTALL | re.MULTILINE)
|
re.DOTALL | re.MULTILINE)
|
||||||
|
|
||||||
# Regular expression object to match assignment statements
|
# Regular expression object to match assignment statements (used in
|
||||||
# (used in findOperands())
|
# findOperands()). If the code immediately following the first
|
||||||
assignRE = re.compile(r'\s*=(?!=)', re.MULTILINE)
|
# appearance of the operand matches this regex, then the operand
|
||||||
|
# appears to be on the LHS of an assignment, and is thus a
|
||||||
|
# destination. basically we're looking for an '=' that's not '=='.
|
||||||
|
# The heinous tangle before that handles the case where the operand
|
||||||
|
# has an array subscript.
|
||||||
|
assignRE = re.compile(r'(\[[^\]]+\])?\s*=(?!=)', re.MULTILINE)
|
||||||
|
|
||||||
def makeFlagConstructor(flag_list):
|
def makeFlagConstructor(flag_list):
|
||||||
if len(flag_list) == 0:
|
if len(flag_list) == 0:
|
||||||
|
|
|
@ -49,6 +49,7 @@ let {{
|
||||||
}};
|
}};
|
||||||
|
|
||||||
output header {{
|
output header {{
|
||||||
|
#include <array>
|
||||||
#include <cstring>
|
#include <cstring>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
|
@ -143,7 +143,7 @@ def template MicroLoadCompleteAcc {{
|
||||||
%(op_decl)s;
|
%(op_decl)s;
|
||||||
%(op_rd)s;
|
%(op_rd)s;
|
||||||
|
|
||||||
Mem = getMem(pkt, dataSize, traceData);
|
getMem(pkt, Mem, dataSize, traceData);
|
||||||
|
|
||||||
%(code)s;
|
%(code)s;
|
||||||
|
|
||||||
|
|
|
@ -1,4 +1,5 @@
|
||||||
// Copyright (c) 2007-2008 The Hewlett-Packard Development Company
|
// Copyright (c) 2007-2008 The Hewlett-Packard Development Company
|
||||||
|
// Copyright (c) 2015 Advanced Micro Devices, Inc.
|
||||||
// All rights reserved.
|
// All rights reserved.
|
||||||
//
|
//
|
||||||
// The license below extends only to copyright in the software and shall
|
// The license below extends only to copyright in the software and shall
|
||||||
|
@ -49,6 +50,7 @@ def operand_types {{
|
||||||
'udw' : 'uint32_t',
|
'udw' : 'uint32_t',
|
||||||
'sqw' : 'int64_t',
|
'sqw' : 'int64_t',
|
||||||
'uqw' : 'uint64_t',
|
'uqw' : 'uint64_t',
|
||||||
|
'u2qw' : 'std::array<uint64_t, 2>',
|
||||||
'sf' : 'float',
|
'sf' : 'float',
|
||||||
'df' : 'double',
|
'df' : 'double',
|
||||||
}};
|
}};
|
||||||
|
|
|
@ -1,5 +1,6 @@
|
||||||
/*
|
/*
|
||||||
* Copyright (c) 2011 Google
|
* Copyright (c) 2011 Google
|
||||||
|
* Copyright (c) 2015 Advanced Micro Devices, Inc.
|
||||||
* All rights reserved.
|
* All rights reserved.
|
||||||
*
|
*
|
||||||
* Redistribution and use in source and binary forms, with or without
|
* Redistribution and use in source and binary forms, with or without
|
||||||
|
@ -31,6 +32,8 @@
|
||||||
#ifndef __ARCH_X86_MEMHELPERS_HH__
|
#ifndef __ARCH_X86_MEMHELPERS_HH__
|
||||||
#define __ARCH_X86_MEMHELPERS_HH__
|
#define __ARCH_X86_MEMHELPERS_HH__
|
||||||
|
|
||||||
|
#include <array>
|
||||||
|
|
||||||
#include "base/types.hh"
|
#include "base/types.hh"
|
||||||
#include "sim/byteswap.hh"
|
#include "sim/byteswap.hh"
|
||||||
#include "sim/insttracer.hh"
|
#include "sim/insttracer.hh"
|
||||||
|
@ -47,10 +50,10 @@ initiateMemRead(XC *xc, Trace::InstRecord *traceData, Addr addr,
|
||||||
return xc->initiateMemRead(addr, dataSize, flags);
|
return xc->initiateMemRead(addr, dataSize, flags);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline uint64_t
|
static void
|
||||||
getMem(PacketPtr pkt, unsigned dataSize, Trace::InstRecord *traceData)
|
getMem(PacketPtr pkt, uint64_t &mem, unsigned dataSize,
|
||||||
|
Trace::InstRecord *traceData)
|
||||||
{
|
{
|
||||||
uint64_t mem;
|
|
||||||
switch (dataSize) {
|
switch (dataSize) {
|
||||||
case 1:
|
case 1:
|
||||||
mem = pkt->get<uint8_t>();
|
mem = pkt->get<uint8_t>();
|
||||||
|
@ -69,9 +72,31 @@ getMem(PacketPtr pkt, unsigned dataSize, Trace::InstRecord *traceData)
|
||||||
}
|
}
|
||||||
if (traceData)
|
if (traceData)
|
||||||
traceData->setData(mem);
|
traceData->setData(mem);
|
||||||
return mem;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
template <size_t N>
|
||||||
|
void
|
||||||
|
getMem(PacketPtr pkt, std::array<uint64_t, N> &mem, unsigned dataSize,
|
||||||
|
Trace::InstRecord *traceData)
|
||||||
|
{
|
||||||
|
assert(dataSize >= 8);
|
||||||
|
assert((dataSize % 8) == 0);
|
||||||
|
|
||||||
|
int num_words = dataSize / 8;
|
||||||
|
assert(num_words <= N);
|
||||||
|
|
||||||
|
auto pkt_data = pkt->getConstPtr<const uint64_t>();
|
||||||
|
for (int i = 0; i < num_words; ++i)
|
||||||
|
mem[i] = gtoh(pkt_data[i]);
|
||||||
|
|
||||||
|
// traceData record only has space for 64 bits, so we just record
|
||||||
|
// the first qword
|
||||||
|
if (traceData)
|
||||||
|
traceData->setData(mem[0]);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
template <class XC>
|
template <class XC>
|
||||||
Fault
|
Fault
|
||||||
readMemAtomic(XC *xc, Trace::InstRecord *traceData, Addr addr, uint64_t &mem,
|
readMemAtomic(XC *xc, Trace::InstRecord *traceData, Addr addr, uint64_t &mem,
|
||||||
|
@ -90,6 +115,30 @@ readMemAtomic(XC *xc, Trace::InstRecord *traceData, Addr addr, uint64_t &mem,
|
||||||
return fault;
|
return fault;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class XC, size_t N>
|
||||||
|
Fault
|
||||||
|
readMemAtomic(XC *xc, Trace::InstRecord *traceData, Addr addr,
|
||||||
|
std::array<uint64_t, N> &mem, unsigned dataSize,
|
||||||
|
unsigned flags)
|
||||||
|
{
|
||||||
|
assert(dataSize >= 8);
|
||||||
|
assert((dataSize % 8) == 0);
|
||||||
|
|
||||||
|
Fault fault = xc->readMem(addr, (uint8_t *)&mem, dataSize, flags);
|
||||||
|
|
||||||
|
if (fault == NoFault) {
|
||||||
|
int num_words = dataSize / 8;
|
||||||
|
assert(num_words <= N);
|
||||||
|
|
||||||
|
for (int i = 0; i < num_words; ++i)
|
||||||
|
mem[i] = gtoh(mem[i]);
|
||||||
|
|
||||||
|
if (traceData)
|
||||||
|
traceData->setData(mem[0]);
|
||||||
|
}
|
||||||
|
return fault;
|
||||||
|
}
|
||||||
|
|
||||||
template <class XC>
|
template <class XC>
|
||||||
Fault
|
Fault
|
||||||
writeMemTiming(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
writeMemTiming(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
||||||
|
@ -102,6 +151,28 @@ writeMemTiming(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
||||||
return xc->writeMem((uint8_t *)&mem, dataSize, addr, flags, res);
|
return xc->writeMem((uint8_t *)&mem, dataSize, addr, flags, res);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class XC, size_t N>
|
||||||
|
Fault
|
||||||
|
writeMemTiming(XC *xc, Trace::InstRecord *traceData,
|
||||||
|
std::array<uint64_t, N> &mem, unsigned dataSize,
|
||||||
|
Addr addr, unsigned flags, uint64_t *res)
|
||||||
|
{
|
||||||
|
assert(dataSize >= 8);
|
||||||
|
assert((dataSize % 8) == 0);
|
||||||
|
|
||||||
|
if (traceData) {
|
||||||
|
traceData->setData(mem[0]);
|
||||||
|
}
|
||||||
|
|
||||||
|
int num_words = dataSize / 8;
|
||||||
|
assert(num_words <= N);
|
||||||
|
|
||||||
|
for (int i = 0; i < num_words; ++i)
|
||||||
|
mem[i] = htog(mem[i]);
|
||||||
|
|
||||||
|
return xc->writeMem((uint8_t *)&mem, dataSize, addr, flags, res);
|
||||||
|
}
|
||||||
|
|
||||||
template <class XC>
|
template <class XC>
|
||||||
Fault
|
Fault
|
||||||
writeMemAtomic(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
writeMemAtomic(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
||||||
|
@ -119,6 +190,31 @@ writeMemAtomic(XC *xc, Trace::InstRecord *traceData, uint64_t mem,
|
||||||
return fault;
|
return fault;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class XC, size_t N>
|
||||||
|
Fault
|
||||||
|
writeMemAtomic(XC *xc, Trace::InstRecord *traceData,
|
||||||
|
std::array<uint64_t, N> &mem, unsigned dataSize,
|
||||||
|
Addr addr, unsigned flags, uint64_t *res)
|
||||||
|
{
|
||||||
|
if (traceData) {
|
||||||
|
traceData->setData(mem[0]);
|
||||||
|
}
|
||||||
|
|
||||||
|
int num_words = dataSize / 8;
|
||||||
|
assert(num_words <= N);
|
||||||
|
|
||||||
|
for (int i = 0; i < num_words; ++i)
|
||||||
|
mem[i] = htog(mem[i]);
|
||||||
|
|
||||||
|
Fault fault = xc->writeMem((uint8_t *)&mem, dataSize, addr, flags, res);
|
||||||
|
|
||||||
|
if (fault == NoFault && res != NULL) {
|
||||||
|
*res = gtoh(*res);
|
||||||
|
}
|
||||||
|
|
||||||
|
return fault;
|
||||||
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
Loading…
Reference in a new issue