UnaryRepeatParams
UnaryRepeatParams为用于控制操作数地址步长的数据结构。结构体内包含操作数相邻迭代间相同block的地址步长,操作数同一迭代内不同block的地址步长等参数。
相邻迭代间相同block的地址步长参数的详细说明请参考相邻迭代间相同datablock的地址步长;同一迭代内不同block的地址步长参数请参考同一迭代内不同datablock的地址步长。
结构体具体定义为:
const int32_t DEFAULT_BLK_NUM = 8;
const int32_t DEFAULT_BLK_STRIDE = 1;
const uint8_t DEFAULT_REPEAT_STRIDE = 8;
struct UnaryRepeatParams {
__aicore__ UnaryRepeatParams()
{
blockNumber = DEFAULT_BLK_NUM;
dstBlkStride = DEFAULT_BLK_STRIDE;
srcBlkStride = DEFAULT_BLK_STRIDE;
dstRepStride = DEFAULT_REPEAT_STRIDE;
srcRepStride = DEFAULT_REPEAT_STRIDE;
halfBlock = false;
}
__aicore__ UnaryRepeatParams(const uint16_t dstBlkStrideIn, const uint16_t srcBlkStrideIn,
const uint8_t dstRepStrideIn, const uint8_t srcRepStrideIn)
{
dstBlkStride = dstBlkStrideIn;
srcBlkStride = srcBlkStrideIn;
dstRepStride = dstRepStrideIn;
srcRepStride = srcRepStrideIn;
}
__aicore__ UnaryRepeatParams(const uint16_t dstBlkStrideIn, const uint16_t srcBlkStrideIn,
const uint8_t dstRepStrideIn, const uint8_t srcRepStrideIn, const bool halfBlockIn)
{
dstBlkStride = dstBlkStrideIn;
srcBlkStride = srcBlkStrideIn;
dstRepStride = dstRepStrideIn;
srcRepStride = srcRepStrideIn;
halfBlock = halfBlockIn;
}
uint32_t blockNumber = 0;
uint16_t dstBlkStride = 0;
uint16_t srcBlkStride = 0;
uint8_t dstRepStride = 0;
uint8_t srcRepStride = 0;
bool repeatStrideMode = false;
bool strideSizeMode = false;
bool halfBlock = false;
};
其中,blockNumber,repeatStrideMode,strideSizeMode为保留参数,用户无需关心,使用默认值即可。halfBlock表示CastDeq指令的结果写入对应UB的上半(halfBlock = true)还是下半(halfBlock = false)部分。用户需要自行定义Block stride参数,包含dstBlkStride,srcBlkStride,以及Repeat stride参数,包含dstRepStride,srcRepStride。
父主题: 基础数据结构