21#ifndef _VARITHM_H_INCLUDED_
22#define _VARITHM_H_INCLUDED_
90void nmppsAbs_4s (
const nm4s* pSrcVec,
nm4s* pDstVec,
int nSize);
91void nmppsAbs_8s (
const nm8s* pSrcVec,
nm8s* pDstVec,
int nSize);
92void nmppsAbs_16s(
const nm16s* pSrcVec,
nm16s* pDstVec,
int nSize);
93void nmppsAbs_32s(
const nm32s* pSrcVec,
nm32s* pDstVec,
int nSize);
94void nmppsAbs_64s(
const nm64s* pSrcVec,
nm64s* pDstVec,
int nSize);
147void nmppsAbs1_4s (
const nm4s* pSrcVec,
nm4s* pDstVec,
int nSize);
148void nmppsAbs1_8s (
const nm8s* pSrcVec,
nm8s* pDstVec,
int nSize);
149void nmppsAbs1_16s(
const nm16s* pSrcVec,
nm16s* pDstVec,
int nSize);
150void nmppsAbs1_32s(
const nm32s* pSrcVec,
nm32s* pDstVec,
int nSize);
151void nmppsAbs1_64s(
const nm64s* pSrcVec,
nm64s* pDstVec,
int nSize);
203void nmppsNeg_8s (
const nm8s* pSrcVec,
nm8s* pDstVec,
int nSize);
204void nmppsNeg_16s(
const nm16s* pSrcVec,
nm16s* pDstVec,
int nSize);
205void nmppsNeg_32s(
const nm32s* pSrcVec,
nm32s* pDstVec,
int nSize);
206void nmppsNeg_64s(
const nm64s* pSrcVec,
nm64s* pDstVec,
int nSize);
264void nmppsAddC_8s (
const nm8s* pSrcVec,
int8b nVal,
nm8s* pDstVec,
int nSize);
265void nmppsAddC_16s (
const nm16s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
266void nmppsAddC_32s (
const nm32s* pSrcVec,
int32b nVal,
nm32s* pDstVec,
int nSize);
267void nmppsAddC_64s (
const nm64s* pSrcVec,
int64b nVal,
nm64s* pDstVec,
int nSize);
325void nmppsAddC_p64s(
const nm64s* pSrcVec,
int64b* pnVal,
nm64s* pDstVec,
int nSize);
383 void nmppsAddC_32fcr(
const nm32fcr *pSrcVec,
nm32fcr *pDstVec,
float nVal,
int nSize);
441void nmppsAdd_4s (
const nm4s* pSrcVec1,
const nm4s* pSrcVec2,
nm4s* pDstVec,
int nSize);
442void nmppsAdd_8s (
const nm8s* pSrcVec1,
const nm8s* pSrcVec2,
nm8s* pDstVec,
int nSize);
443void nmppsAdd_16s(
const nm16s* pSrcVec1,
const nm16s* pSrcVec2,
nm16s* pDstVec,
int nSize);
444void nmppsAdd_32s(
const nm32s* pSrcVec1,
const nm32s* pSrcVec2,
nm32s* pDstVec,
int nSize);
445void nmppsAdd_64s(
const nm64s* pSrcVec1,
const nm64s* pSrcVec2,
nm64s* pDstVec,
int nSize);
501void nmppsAdd_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2, nm32f* pDstVec,
int nSize);
557void nmppsAddC_32f (
const nm32f* pSrcVec, nm32f* pDstVec,
float C,
int nSize);
560void nmppsAddEx_64s (
const nm64s *pSrcVec1,
int srcStep1,
const nm64s *pSrcVec2,
int srcStep2,
nm64s *pDstVec,
int dstStep,
int nSize );
632void nmppsAdd_AddC_32s(
nm32s* pSrcVec1,
nm32s* pSrcVec2,
int nVal,
nm32s* pDstVec,
int nSize);
690void nmppsSubC_4s (
const nm4s* pSrcVec,
int4b nVal,
nm4s* pDstVec,
int nSize);
691void nmppsSubC_8s (
const nm8s* pSrcVec,
int8b nVal,
nm8s* pDstVec,
int nSize);
692void nmppsSubC_16s(
const nm16s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
693void nmppsSubC_32s(
const nm32s* pSrcVec,
int32b nVal,
nm32s* pDstVec,
int nSize);
694void nmppsSubC_64s(
const nm64s* pSrcVec,
int64b nVal,
nm64s* pDstVec,
int nSize);
750void nmppsSubC_32f (
const nm32f* pSrcVec, nm32f* pDstVec,
float C,
int nSize);
808void nmppsSubCRev_8s (
const nm8s* pSrcVec,
int8b nVal,
nm8s* pDstVec,
int nSize);
809void nmppsSubCRev_16s(
const nm16s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
810void nmppsSubCRev_32s(
const nm32s* pSrcVec,
int32b nVal,
nm32s* pDstVec,
int nSize);
811void nmppsSubCRev_64s(
const nm64s* pSrcVec,
int64b nVal,
nm64s* pDstVec,
int nSize);
870void nmppsSubCRev_32f (
const nm32f* pSrcVec, nm32f* pDstVec,
float C,
int nSize);
926void nmppsSub_4s (
const nm4s* pSrcVec1,
nm4s* pSrcVec2,
nm4s* pDstVec,
int nSize);
927void nmppsSub_8s (
const nm8s* pSrcVec1,
nm8s* pSrcVec2,
nm8s* pDstVec,
int nSize);
928void nmppsSub_16s(
const nm16s* pSrcVec1,
nm16s* pSrcVec2,
nm16s* pDstVec,
int nSize);
929void nmppsSub_32s(
const nm32s* pSrcVec1,
nm32s* pSrcVec2,
nm32s* pDstVec,
int nSize);
930void nmppsSub_64s(
const nm64s* pSrcVec1,
nm64s* pSrcVec2,
nm64s* pDstVec,
int nSize);
986void nmppsSub_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2, nm32f* pDstVec,
int nSize);
1054void nmppsAbsDiff_8s (
const nm8s* pSrcVec1,
nm8s* pSrcVec2,
nm8s* pDstVec,
int nSize);
1055void nmppsAbsDiff_16s(
const nm16s* pSrcVec1,
nm16s* pSrcVec2,
nm16s* pDstVec,
int nSize);
1056void nmppsAbsDiff_32s(
const nm32s* pSrcVec1,
nm32s* pSrcVec2,
nm32s* pDstVec,
int nSize);
1057void nmppsAbsDiff_64s(
const nm64s* pSrcVec1,
nm64s* pSrcVec2,
nm64s* pDstVec,
int nSize);
1115void nmppsAbsDiff_32f(
const nm32f* pSrcVec1, nm32f* pSrcVec2, nm32f* pDstVec,
int nSize);
1186void nmppsAbsDiff1_8s(
nm8s* pSrcVec1,
nm8s* pSrcVec2,
nm8s* pDstVec,
int nSize);
1243void nmppsMulC_8s (
const nm8s* pSrcVec,
int8b nVal,
nm8s* pDstVec,
int nSize);
1244void nmppsMulC_8s16s (
const nm8s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
1245void nmppsMulC_16s (
const nm16s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
1246void nmppsMulC_16s32s(
const nm16s* pSrcVec,
int32b nVal,
nm32s* pDstVec,
int nSize);
1247void nmppsMulC_32s (
const nm32s* pSrcVec,
int32b nVal,
nm32s* pDstVec,
int nSize);
1248void nmppsMulC_32s64s(
const nm32s* pSrcVec,
int64b nVal,
nm64s* pDstVec,
int nSize);
1249void nmppsMulC_64s (
const nm64s* pSrcVec,
int64b nVal,
nm64s* pDstVec,
int nSize);
1251void nmppsMulC_2s16s (
const nm2s* pSrcVec,
int16b nVal,
nm16s* pDstVec,
int nSize);
1298void nmppsMulC_32f(
const nm32f* pSrcVec, nm32f* pDstVec,
float C,
int nSize);
1356void nmppsMul_Mul_Add_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2,
const nm32f* pSrcVec3,
const nm32f* pSrcVec4, nm32f* pDstVec,
int nSize);
1358void nmppsMul_Mul_Add_64f(
const nm64f *pSrcVec1,
const nm64f *pSrcVec2,
const nm64f *pSrcVec3,
const nm64f *pSrcVec4, nm64f *pDstVec,
int nSize);
1409void nmppsMul_Add_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2,
const nm32f* pSrcVecAdd, nm32f* pDstVec,
int nSize);
1410void nmppsMul_Add_64f(
const nm64f* pSrcVec1,
const nm64f* pSrcVec2,
const nm64f* pSrcVecAdd, nm64f* pDstVec,
int nSize);
1519void nmppsMulC_AddC_32f(
const nm32f* pSrcVec,
float nMulC,
float nAddC, nm32f* pDstVec,
int nSize);
1576void nmppsMulC_AddV_AddC_32f(nm32f* pSrcVec,
float nMulC, nm32f* pVecAdd,
float nAddC, nm32f* pDstVec,
int nSize);
1621void nmppsMul_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2, nm32f* pDstVec,
int nSize);
1667void nmppsConjMul_32fcr(
const nm32fcr *pSrcVec1,
const nm32fcr *pSrcVec2,
nm32fcr *pDstVec,
int nSize);
1724void nmppsMul_Mul_Sub_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2,
const nm32f* pSrcVec3,
const nm32f* pSrcVec4, nm32f* pDstVec,
int nSize);
1771void nmppsMulC_AddV_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2, nm32f* pDstVec,
float C,
int nSize);
1776void nmppsMulC_AddC_2s16s(
const nm2s* pSrcVec,
int32b nMulC,
int nAddC,
nm16s* pDstVec,
int nSize);
1838void nmppsMul_AddC_64s(
const nm64s* pSrcVec1,
const nm64s* pSrcVec2,
const nm64s* pnVal,
nm64s* pDstVec,
int nSize);
1901void nmppsMul_AddC_32f(
const nm32f* pSrcVec1,
const nm32f* pSrcVec2,
float nValueAddC, nm32f* pDstVec,
int nSize);
1963void nmppsMulC_AddC_32s(
const nm32s* pSrcVec,
int nMulVal,
int nAddVal,
nm32s* pDstVec,
int nSize);
2023void nmppsRShiftC_MulC_AddC_2x32s(
int32x2* dataSparseSrc,
int32x2* preshiftArg,
int32x2* mulArg,
int32x2* addArg,
int32x2 *dataSparseDst,
int size,
int stepSparseSrc,
int stepSparseDst);
2093void nmppsMulC_AddV_AddC_32s(
nm32s* pSrcVec1,
int nMulVal,
nm32s* pSrcVec2,
int nAddVal,
nm32s* pDstVec,
int nSize);
2155void nmppsSumN_8s16s(
nm8s ** ppSrcVec,
nm16s* pDstVec,
int nSize,
int nNumberOfVectors);
2156void nmppsSumN_16s (
nm16s ** ppSrcVec,
nm16s* pDstVec,
int nSize,
int nNumberOfVectors);
2256void nmppsDivC_32s(
nm32s* pSrcVec,
int nDivisor,
nm32s* pDstVec,
int nSize,
void* pTmpBuf1,
void* pTmpBuf2);
2308void nmppsSum_8s (
const nm8s* pSrcVec,
int nSize,
int32b *pnRes);
2309void nmppsSum_16s(
const nm16s* pSrcVec,
int nSize,
int64b *pnRes);
2310void nmppsSum_32s(
const nm32s* pSrcVec,
int nSize,
int64b *pnRes);
2311void nmppsSum_64s(
const nm64s* pSrcVec,
int nSize,
int64b *pnRes);
2365void nmppsSum_1 (
const nm1* pSrcVec,
int nSize,
int32b* pnRes,
void* pTmpBuf);
2440int nmppsDotProd_8s8sm (
const nm8s* pSrcVec1,
const nm8s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2441int nmppsDotProd_8s16sm (
const nm8s* pSrcVec1,
const nm16s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2442int nmppsDotProd_8s32sm (
const nm8s* pSrcVec1,
const nm32s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2443int nmppsDotProd_16s16sm(
const nm16s* pSrcVec1,
const nm16s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2444int nmppsDotProd_16s32sm(
const nm16s* pSrcVec1,
const nm32s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2445int nmppsDotProd_32s32sm(
const nm32s* pSrcVec1,
const nm32s* pSrcVec2,
int nSize,
int64b* pnRes,
nm64s* tmp);
2500void nmppsDotProd_8s64s (
const nm8s* pSrcVec1,
const nm64s* pSrcVec2,
int nSize,
int64b* pnRes);
2501void nmppsDotProd_16s64s (
const nm16s* pSrcVec1,
const nm64s* pSrcVec2,
int nSize,
int64b* pnRes);
2502void nmppsDotProd_32s64s (
const nm32s* pSrcVec1,
const nm64s* pSrcVec2,
int nSize,
int64b* pnRes);
2503void nmppsDotProd_64s64s (
const nm64s* pSrcVec1,
const nm64s* pSrcVec2,
int nSize,
int64b* pnRes);
2574void nmppsWeightedSum_8s16s(
nm8s* pSrcVec1,
int nW1,
nm8s* pSrcVec2,
int nW2,
nm16s* pDstVec,
int nSize);
2575void nmppsWeightedSum_16s32s(
nm16s* pSrcVec1,
int nW1,
nm16s* pSrcVec2,
int nW2,
nm32s* pDstVec,
int nSize);
2579void nmppsMulC_Add_32fcr(
const nm32fcr* pSrcVec1,
const nm32fcr* pSrcVec2,
nm32fcr* pDstVec,
float C,
int nSize);
/*
 * Cross-reference carried over from the documentation listing:
 *
 *   void nmppsMulC_AddC_2x32s(int32x2 *dataSparseSrc, int32x2 *mulArg,
 *                             int32x2 *addArg, int32x2 *dataSparseDst,
 *                             int size, int stepSparseSrc,
 *                             int stepSparseDst)
 *
 *   Sparse vector by constant multiplication with addition of constant.
 */
/*
 * Type cross-reference carried over from the documentation listing
 * (underlying type, type name, location of the definition):
 *
 *   int        int4b    Definition: nmtype.h:592
 *   int        int8b    Definition: nmtype.h:618
 *   int        int32b   Definition: nmtype.h:683
 *   int        int16b   Definition: nmtype.h:644
 *   INT64      int64b   Definition: nmtype.h:709
 *   int        nm32s    Definition: nmtype.h:292
 *   long long  nm64s    Definition: nmtype.h:375
 *   void       nm2s     Definition: nmtype.h:116
 *   int        nm1      Definition: nmtype.h:100
 *   short      nm16s    Definition: nmtype.h:243
 *   void       nm4s     Definition: nmtype.h:129
 *   char       nm8s     Definition: nmtype.h:167
 *   (name missing from the listing)  Definition: nmtype.h:1335
 *   (name missing from the listing)  Definition: nmtype.h:1364
 */