昇腾社区首页
中文
注册
开发者
下载

vcmpvs

功能说明

将向量 src0 逐元素与标量 src1 进行比较,如果比较后的结果为真,则输出结果的对应比特位为1,否则为0。

元素类型为f16时,向量中元素个数为128,因此结果是一个连续的128bit,写入dst中,重复计算时,新的dst = dst + 16Bytes。

元素类型为f32时,向量中元素个数为64,因此结果是一个连续的64bit,写入dst中,重复计算时,新的dst = dst + 8Bytes。

支持多种比较接口:

  • EQ:src0等于src1(equal to)
  • NE:src0不等于src1(not equal to)
  • LT:src0小于src1(less than)
  • GT:src0大于src1(greater than)
  • LE:src0小于或等于src1(less than or equal to)
  • GE:src0大于或等于src1(greater than or equal to)

int32类型只支持eq接口。

该接口无MASK参数。

接口原型

// 相同接口的不同原型区别在于源地址和目的地址的数据类型不同
// vcmpvs_eq 
void vcmpvs_eq(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_eq(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_eq(__ubuf__ uint8_t *dst, __ubuf__ int32_t *src0, int32_t src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t src0BlockStride, uint16_t dstRepeatStride, uint16_t src0RepeatStride);

// vcmpvs_ne
void vcmpvs_ne(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_ne(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

// vcmpvs_lt
void vcmpvs_lt(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_lt(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

// vcmpvs_gt
void vcmpvs_gt(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_gt(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

// vcmpvs_le
void vcmpvs_le(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_le(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

// vcmpvs_ge
void vcmpvs_ge(__ubuf__ uint8_t *dst, __ubuf__ half *src0, half src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

void vcmpvs_ge(__ubuf__ uint8_t *dst, __ubuf__ float *src0, float src1, uint8_t repeat, uint16_t dstBlockStride, uint16_t srcBlockStride, uint16_t dstRepeatStride, uint16_t srcRepeatStride);

参数说明

参数含义见 表1 单目运算参数说明

流水类型

PIPE_V