|
Poplar and PopLibs
|
IPU intrinsic functions. More...
Functions | |
| int | andc (int src0, int src1) |
Targets the andc instruction. More... | |
| unsigned | andc (unsigned src0, unsigned src1) |
Targets the andc instruction. More... | |
| float | andc (float src0, float src1) |
Targets the andc instruction. More... | |
| float2 | andc (float2 src0, float2 src1) |
Targets the andc64 instruction. More... | |
| int | bitrev8 (int src) |
Targets the bitrev8 instruction. More... | |
| unsigned | cms (int src) |
Targets the cms instruction. More... | |
| float2 | roll32 (float2 src0, float2 src1) |
Targets the roll32 instruction. More... | |
| int | roll8l (int src0, int src1) |
Targets the roll8l instruction. More... | |
| int | roll8r (int src0, int src1) |
Targets the roll8r instruction. More... | |
| int | shuf8x8hi (int src0, int src1) |
Targets the shuf8x8hi instruction. More... | |
| int | shuf8x8lo (int src0, int src1) |
Targets the shuf8x8lo instruction. More... | |
| float2 | sort4x32hi (float2 src0, float2 src1) |
Targets the sort4x32hi instruction. More... | |
| float2 | sort4x32lo (float2 src0, float2 src1) |
Targets the sort4x32lo instruction. More... | |
| int | sort8 (int src) |
Targets the sort8 instruction. More... | |
| int | sort8x8hi (int src0, int src1) |
Targets the sort8x8hi instruction. More... | |
| int | sort8x8lo (int src0, int src1) |
Targets the sort8x8lo instruction. More... | |
| int | swap8 (int src) |
Targets the swap8 instruction. More... | |
| half2 | absadd (half2 src0, half2 src1) |
Targets the f16v2absadd instruction. More... | |
| half4 | absadd (half4 src0, half4 src1) |
Targets the f16v4absadd instruction. More... | |
| float2 | absadd (float2 src0, float2 src1) |
Targets the f32v2absadd instruction. More... | |
| float | absadd (float src0, float src1) |
Targets the f32absadd instruction. More... | |
| half2 | absmax (half2 src0, half2 src1) |
Targets the f16v2absmax instruction. More... | |
| half4 | absmax (half4 src0, half4 src1) |
Targets the f16v4absmax instruction. More... | |
| float2 | absmax (float2 src0, float2 src1) |
Targets the f32v2absmax instruction. More... | |
| float | absmax (float src0, float src1) |
Targets the f32absmax instruction. More... | |
| half2 | max (half2 src0, half2 src1) |
Targets the f16v2max instruction. More... | |
| half4 | max (half4 src0, half4 src1) |
Targets the f16v4max instruction. More... | |
| float2 | max (float2 src0, float2 src1) |
Targets the f32v2max instruction. More... | |
| float | max (float src0, float src1) |
Targets the f32max instruction. More... | |
| half2 | maxc (half4 src) |
Targets the f16v4maxc instruction. More... | |
| half2 | min (half2 src0, half2 src1) |
Targets the f16v2min instruction. More... | |
| half4 | min (half4 src0, half4 src1) |
Targets the f16v4min instruction. More... | |
| float2 | min (float2 src0, float2 src1) |
Targets the f32v2min instruction. More... | |
| float | min (float src0, float src1) |
Targets the f32min instruction. More... | |
| half2 | clamp (half2 src0, half2 src1) |
Targets the f16v2clamp instruction. More... | |
| half4 | clamp (half4 src0, half2 src1) |
Targets the f16v4clamp instruction. More... | |
| float2 | clamp (float2 src0, float2 src1) |
Targets the f32v2clamp instruction. More... | |
| float | clamp (float src0, float2 src1) |
Targets the f32clamp instruction. More... | |
| void | cmac (half2 src0, half2 src1) |
Targets the f16v2cmac instruction. More... | |
| void | cmac (half4 src0, half4 src1) |
Targets the f16v4cmac instruction. More... | |
| half2 | exp (half2 src) |
Targets the f16v2exp instruction. More... | |
| float | exp (float src) |
Targets the f32exp instruction. More... | |
| half2 | exp2 (half2 src) |
Targets the f16v2exp2 instruction. More... | |
| float | exp2 (float src) |
Targets the f32exp2 instruction. More... | |
| half2 | log2 (half2 src) |
Targets the f16v2log2 instruction. More... | |
| float | log2 (float src) |
Targets the f32log2 instruction. More... | |
| half2 | tanh (half2 src) |
Targets the f16v2tanh instruction. More... | |
| float | tanh (float src) |
Targets the f32tanh instruction. More... | |
| half2 | ln (half2 src) |
Targets the f16v2ln instruction. More... | |
| float | ln (float src) |
Targets the f32ln instruction. More... | |
| float2 | axpy (float2 src0, float2 src1) |
Targets the f32v2axpy instruction. More... | |
| half2 | f16v2grand () |
Targets the f16v2grand instruction. More... | |
| float2 | f32v2grand () |
Targets the f32v2grand instruction. More... | |
| half4 | rmask (half4 src0, float src1) |
Targets the f16v4rmask instruction. More... | |
| float2 | rmask (float2 src0, float src1) |
Targets the f32v2rmask instruction. More... | |
| half2 | sigm (half2 src) |
Targets the f16v2sigm instruction. More... | |
| float | sigm (float src) |
Targets the f32sigm instruction. More... | |
| float | sum (half2 src) |
Targets the f16v2sum instruction. More... | |
| float2 | sum (half4 src) |
Targets the f16v4sum instruction. More... | |
| half2 | cmpeq (half2 src0, half2 src1) |
Targets the f16v2cmpeq instruction. More... | |
| half4 | cmpeq (half4 src0, half4 src1) |
Targets the f16v4cmpeq instruction. More... | |
| float2 | cmpeq (float2 src0, float2 src1) |
Targets the f32v2cmpeq instruction. More... | |
| float | cmpeq (float src0, float src1) |
Targets the f32cmpeq instruction. More... | |
| half2 | cmpge (half2 src0, half2 src1) |
Targets the f16v2cmpge instruction. More... | |
| half4 | cmpge (half4 src0, half4 src1) |
Targets the f16v4cmpge instruction. More... | |
| float2 | cmpge (float2 src0, float2 src1) |
Targets the f32v2cmpge instruction. More... | |
| float | cmpge (float src0, float src1) |
Targets the f32cmpge instruction. More... | |
| half2 | cmpgt (half2 src0, half2 src1) |
Targets the f16v2cmpgt instruction. More... | |
| half4 | cmpgt (half4 src0, half4 src1) |
Targets the f16v4cmpgt instruction. More... | |
| float2 | cmpgt (float2 src0, float2 src1) |
Targets the f32v2cmpgt instruction. More... | |
| float | cmpgt (float src0, float src1) |
Targets the f32cmpgt instruction. More... | |
| half2 | cmple (half2 src0, half2 src1) |
Targets the f16v2cmple instruction. More... | |
| half4 | cmple (half4 src0, half4 src1) |
Targets the f16v4cmple instruction. More... | |
| float2 | cmple (float2 src0, float2 src1) |
Targets the f32v2cmple instruction. More... | |
| float | cmple (float src0, float src1) |
Targets the f32cmple instruction. More... | |
| half2 | cmplt (half2 src0, half2 src1) |
Targets the f16v2cmplt instruction. More... | |
| half4 | cmplt (half4 src0, half4 src1) |
Targets the f16v4cmplt instruction. More... | |
| float2 | cmplt (float2 src0, float2 src1) |
Targets the f32v2cmplt instruction. More... | |
| float | cmplt (float src0, float src1) |
Targets the f32cmplt instruction. More... | |
| half2 | cmpne (half2 src0, half2 src1) |
Targets the f16v2cmpne instruction. More... | |
| half4 | cmpne (half4 src0, half4 src1) |
Targets the f16v4cmpne instruction. More... | |
| float2 | cmpne (float2 src0, float2 src1) |
Targets the f32v2cmpne instruction. More... | |
| float | cmpne (float src0, float src1) |
Targets the f32cmpne instruction. More... | |
| unsigned | clz (int src) |
Targets the clz instruction. More... | |
| unsigned | popc (int src) |
Targets the popc instruction. More... | |
| short2 | roll16 (short2 src0, short2 src1) |
Targets the roll16 instruction. More... | |
| ushort2 | roll16 (ushort2 src0, ushort2 src1) |
Targets the roll16 instruction. More... | |
| half2 | roll16 (half2 src0, half2 src1) |
Targets the roll16 instruction. More... | |
| short2 | sort4x16hi (short2 src0, short2 src1) |
Targets the sort4x16hi instruction. More... | |
| ushort2 | sort4x16hi (ushort2 src0, ushort2 src1) |
Targets the sort4x16hi instruction. More... | |
| half2 | sort4x16hi (half2 src0, half2 src1) |
Targets the sort4x16hi instruction. More... | |
| short2 | sort4x16lo (short2 src0, short2 src1) |
Targets the sort4x16lo instruction. More... | |
| ushort2 | sort4x16lo (ushort2 src0, ushort2 src1) |
Targets the sort4x16lo instruction. More... | |
| half2 | sort4x16lo (half2 src0, half2 src1) |
Targets the sort4x16lo instruction. More... | |
| half | load_postinc (const half **a, int i) |
Post-incrementing load, targeting the ldb16step instruction. More... | |
| void | store_postinc (half2 **a, half2 v, int i) |
Post-incrementing store, targeting the st32step instruction. More... | |
| half2 | load_postinc (const half2 **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (half4 **a, half4 v, int i) |
Post-incrementing store, targeting the st64step instruction. More... | |
| half4 | load_postinc (const half4 **a, int i) |
Post-incrementing load, targeting the ld64step instruction. More... | |
| void | store_postinc (float **a, float v, int i) |
Post-incrementing store, targeting the st32step instruction. More... | |
| float | load_postinc (const float **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (float2 **a, float2 v, int i) |
Post-incrementing store, targeting the st64step instruction. More... | |
| float2 | load_postinc (const float2 **a, int i) |
Post-incrementing load, targeting the ld64step instruction. More... | |
| void | store_postinc (int **a, int v, int i) |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise. More... | |
| int | load_postinc (const int **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (unsigned **a, unsigned v, int i) |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise. More... | |
| unsigned | load_postinc (const unsigned **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (int2 **a, int2 v, int i) |
| Post-incrementing store. More... | |
| int2 | load_postinc (const int2 **a, int i) |
| Post-incrementing load. More... | |
| void | store_postinc (uint2 **a, uint2 v, int i) |
| Post-incrementing store. More... | |
| uint2 | load_postinc (const uint2 **a, int i) |
| Post-incrementing load. More... | |
| void | store_postinc (short **a, short v, int i) |
| Post-incrementing store. More... | |
| short | load_postinc (const short **a, int i) |
Post-incrementing load, targeting the lds16step instruction. More... | |
| void | store_postinc (unsigned short **a, unsigned short v, int i) |
| Post-incrementing store. More... | |
| unsigned short | load_postinc (const unsigned short **a, int i) |
Post-incrementing load, targeting the ldz16step instruction. More... | |
| void | store_postinc (short2 **a, short2 v, int i) |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise. More... | |
| short2 | load_postinc (const short2 **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (ushort2 **a, ushort2 v, int i) |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise. More... | |
| ushort2 | load_postinc (const ushort2 **a, int i) |
Post-incrementing load, targeting the ld32step instruction. More... | |
| void | store_postinc (short4 **a, short4 v, int i) |
| Post-incrementing store. More... | |
| short4 | load_postinc (const short4 **a, int i) |
| Post-incrementing load. More... | |
| void | store_postinc (ushort4 **a, ushort4 v, int i) |
| Post-incrementing store. More... | |
| ushort4 | load_postinc (const ushort4 **a, int i) |
| Post-incrementing load. More... | |
| void | store_postinc (char **a, char v, int i) |
| Post-incrementing store. More... | |
| char | load_postinc (const char **a, int i) |
Post-incrementing load, targeting the lds8step instruction. More... | |
| void | store_postinc (unsigned char **a, unsigned char v, int i) |
| Post-incrementing store. More... | |
| unsigned char | load_postinc (const unsigned char **a, int i) |
Post-incrementing load, targeting the ldz8step instruction. More... | |
| float | acos (float x) |
| The arccos function, the inverse of cosine. More... | |
| float2 | acos (float2 x) |
| The arccos function, the inverse of cosine. More... | |
| half | acos (half x) |
| The arccos function, the inverse of cosine. More... | |
| half2 | acos (half2 x) |
| The arccos function, the inverse of cosine. More... | |
| half4 | acos (half4 x) |
| The arccos function, the inverse of cosine. More... | |
| float | acosh (float x) |
| The arccosh function, the inverse of the hyperbolic cosine. More... | |
| float2 | acosh (float2 x) |
| The arccosh function, the inverse of the hyperbolic cosine. More... | |
| half | acosh (half x) |
| The arccosh function, the inverse of the hyperbolic cosine. More... | |
| half2 | acosh (half2 x) |
| The arccosh function, the inverse of the hyperbolic cosine. More... | |
| half4 | acosh (half4 x) |
| The arccosh function, the inverse of the hyperbolic cosine. More... | |
| float | asin (float x) |
| The arcsin function, the inverse of sine. More... | |
| float2 | asin (float2 x) |
| The arcsin function, the inverse of sine. More... | |
| half | asin (half x) |
| The arcsin function, the inverse of sine. More... | |
| half2 | asin (half2 x) |
| The arcsin function, the inverse of sine. More... | |
| half4 | asin (half4 x) |
| The arcsin function, the inverse of sine. More... | |
| float | asinh (float x) |
| The arcsinh function, the inverse of the hyperbolic sine. More... | |
| float2 | asinh (float2 x) |
| The arcsinh function, the inverse of the hyperbolic sine. More... | |
| half | asinh (half x) |
| The arcsinh function, the inverse of the hyperbolic sine. More... | |
| half2 | asinh (half2 x) |
| The arcsinh function, the inverse of the hyperbolic sine. More... | |
| half4 | asinh (half4 x) |
| The arcsinh function, the inverse of the hyperbolic sine. More... | |
| float | atan (float x) |
| The arctan function, the inverse of tangent. More... | |
| float2 | atan (float2 x) |
| The arctan function, the inverse of tangent. More... | |
| half | atan (half x) |
| The arctan function, the inverse of tangent. More... | |
| half2 | atan (half2 x) |
| The arctan function, the inverse of tangent. More... | |
| half4 | atan (half4 x) |
| The arctan function, the inverse of tangent. More... | |
| float | atanh (float x) |
| The arctanh function, the inverse of the hyperbolic tangent. More... | |
| float2 | atanh (float2 x) |
| The arctanh function, the inverse of the hyperbolic tangent. More... | |
| half | atanh (half x) |
| The arctanh function, the inverse of the hyperbolic tangent. More... | |
| half2 | atanh (half2 x) |
| The arctanh function, the inverse of the hyperbolic tangent. More... | |
| half4 | atanh (half4 x) |
| The arctanh function, the inverse of the hyperbolic tangent. More... | |
| float | cbrt (float x) |
| The cubic root function. More... | |
| float2 | cbrt (float2 x) |
| The cubic root function. More... | |
| half | cbrt (half x) |
| The cubic root function. More... | |
| half2 | cbrt (half2 x) |
| The cubic root function. More... | |
| half4 | cbrt (half4 x) |
| The cubic root function. More... | |
| float | ceil (float x) |
| Rounds up input to the closest integral value. More... | |
| float2 | ceil (float2 x) |
| Rounds up input to the closest integral value. More... | |
| half | ceil (half x) |
| Rounds up input to the closest integral value. More... | |
| half2 | ceil (half2 x) |
| Rounds up input to the closest integral value. More... | |
| half4 | ceil (half4 x) |
| Rounds up input to the closest integral value. More... | |
| float | cos (float x) |
| The trigonometric cosine function. More... | |
| float2 | cos (float2 x) |
| The trigonometric cosine function. More... | |
| half | cos (half x) |
| The trigonometric cosine function. More... | |
| half2 | cos (half2 x) |
| The trigonometric cosine function. More... | |
| half4 | cos (half4 x) |
| The trigonometric cosine function. More... | |
| float | cosh (float x) |
| The hyperbolic cosine function. More... | |
| float2 | cosh (float2 x) |
| The hyperbolic cosine function. More... | |
| half | cosh (half x) |
| The hyperbolic cosine function. More... | |
| half2 | cosh (half2 x) |
| The hyperbolic cosine function. More... | |
| half4 | cosh (half4 x) |
| The hyperbolic cosine function. More... | |
| float | erf (float x) |
| The error function. More... | |
| float2 | erf (float2 x) |
| The error function. More... | |
| half | erf (half x) |
| The error function. More... | |
| half2 | erf (half2 x) |
| The error function. More... | |
| half4 | erf (half4 x) |
| The error function. More... | |
| float | erfc (float x) |
| The complementary error function. More... | |
| float2 | erfc (float2 x) |
| The complementary error function. More... | |
| half | erfc (half x) |
| The complementary error function. More... | |
| half2 | erfc (half2 x) |
| The complementary error function. More... | |
| half4 | erfc (half4 x) |
| The complementary error function. More... | |
| float2 | exp (float2 x) |
| The base-e exponential function. More... | |
| half | exp (half x) |
| The base-e exponential function. More... | |
| half4 | exp (half4 x) |
| The base-e exponential function. More... | |
| float2 | exp2 (float2 x) |
| The base-2 exponential function. More... | |
| half | exp2 (half x) |
| The base-2 exponential function. More... | |
| half4 | exp2 (half4 x) |
| The base-2 exponential function. More... | |
| float | expm1 (float x) |
The base-e exponential function, minus one: exp(x) - 1. More... | |
| float2 | expm1 (float2 x) |
The base-e exponential function, minus one: exp(x) - 1. More... | |
| half | expm1 (half x) |
The base-e exponential function, minus one: exp(x) - 1. More... | |
| half2 | expm1 (half2 x) |
The base-e exponential function, minus one: exp(x) - 1. More... | |
| half4 | expm1 (half4 x) |
The base-e exponential function, minus one: exp(x) - 1. More... | |
| float | fabs (float x) |
| Computes the absolute value of the input. More... | |
| float2 | fabs (float2 x) |
| Computes the absolute value of the input. More... | |
| half | fabs (half x) |
| Computes the absolute value of the input. More... | |
| half2 | fabs (half2 x) |
| Computes the absolute value of the input. More... | |
| half4 | fabs (half4 x) |
| Computes the absolute value of the input. More... | |
| float | floor (float x) |
| Rounds down input to the closest integral value. More... | |
| float2 | floor (float2 x) |
| Rounds down input to the closest integral value. More... | |
| half | floor (half x) |
| Rounds down input to the closest integral value. More... | |
| half2 | floor (half2 x) |
| Rounds down input to the closest integral value. More... | |
| half4 | floor (half4 x) |
| Rounds down input to the closest integral value. More... | |
| float | log (float x) |
| The natural logarithm. More... | |
| float2 | log (float2 x) |
| The natural logarithm. More... | |
| half | log (half x) |
| The natural logarithm. More... | |
| half2 | log (half2 x) |
| The natural logarithm. More... | |
| half4 | log (half4 x) |
| The natural logarithm. More... | |
| float | log10 (float x) |
| The base-10 logarithm. More... | |
| float2 | log10 (float2 x) |
| The base-10 logarithm. More... | |
| half | log10 (half x) |
| The base-10 logarithm. More... | |
| half2 | log10 (half2 x) |
| The base-10 logarithm. More... | |
| half4 | log10 (half4 x) |
| The base-10 logarithm. More... | |
| float | log1p (float x) |
The natural logarithm of 1 + x. More... | |
| float2 | log1p (float2 x) |
The natural logarithm of 1 + x. More... | |
| half | log1p (half x) |
The natural logarithm of 1 + x. More... | |
| half2 | log1p (half2 x) |
The natural logarithm of 1 + x. More... | |
| half4 | log1p (half4 x) |
The natural logarithm of 1 + x. More... | |
| float2 | log2 (float2 x) |
| The base-2 logarithm. More... | |
| half | log2 (half x) |
| The base-2 logarithm. More... | |
| half4 | log2 (half4 x) |
| The base-2 logarithm. More... | |
| float | nearbyint (float x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| float2 | nearbyint (float2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half | nearbyint (half x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half2 | nearbyint (half2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half4 | nearbyint (half4 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| float | rint (float x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| float2 | rint (float2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half | rint (half x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half2 | rint (half2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| half4 | rint (half4 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| float | round (float x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| float2 | round (float2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| half | round (half x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| half2 | round (half2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| half4 | round (half4 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| float | sin (float x) |
| The trigonometric sine function. More... | |
| float2 | sin (float2 x) |
| The trigonometric sine function. More... | |
| half | sin (half x) |
| The trigonometric sine function. More... | |
| half2 | sin (half2 x) |
| The trigonometric sine function. More... | |
| half4 | sin (half4 x) |
| The trigonometric sine function. More... | |
| float | sinh (float x) |
| The hyperbolic sine function. More... | |
| float2 | sinh (float2 x) |
| The hyperbolic sine function. More... | |
| half | sinh (half x) |
| The hyperbolic sine function. More... | |
| half2 | sinh (half2 x) |
| The hyperbolic sine function. More... | |
| half4 | sinh (half4 x) |
| The hyperbolic sine function. More... | |
| float | sqrt (float x) |
| The square root function. More... | |
| float2 | sqrt (float2 x) |
| The square root function. More... | |
| half | sqrt (half x) |
| The square root function. More... | |
| half2 | sqrt (half2 x) |
| The square root function. More... | |
| half4 | sqrt (half4 x) |
| The square root function. More... | |
| float | rsqrt (float x) |
| The reciprocal square root function. More... | |
| float2 | rsqrt (float2 x) |
| The reciprocal square root function. More... | |
| half | rsqrt (half x) |
| The reciprocal square root function. More... | |
| half2 | rsqrt (half2 x) |
| The reciprocal square root function. More... | |
| half4 | rsqrt (half4 x) |
| The reciprocal square root function. More... | |
| float | tan (float x) |
| The trigonometric tangent function. More... | |
| float2 | tan (float2 x) |
| The trigonometric tangent function. More... | |
| half | tan (half x) |
| The trigonometric tangent function. More... | |
| half2 | tan (half2 x) |
| The trigonometric tangent function. More... | |
| half4 | tan (half4 x) |
| The trigonometric tangent function. More... | |
| float2 | tanh (float2 x) |
| The hyperbolic tangent function. More... | |
| half | tanh (half x) |
| The hyperbolic tangent function. More... | |
| half4 | tanh (half4 x) |
| The hyperbolic tangent function. More... | |
| float | tgamma (float x) |
| The gamma function. More... | |
| float2 | tgamma (float2 x) |
| The gamma function. More... | |
| half | tgamma (half x) |
| The gamma function. More... | |
| half2 | tgamma (half2 x) |
| The gamma function. More... | |
| half4 | tgamma (half4 x) |
| The gamma function. More... | |
| float | trunc (float x) |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x. More... | |
| float2 | trunc (float2 x) |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x. More... | |
| half | trunc (half x) |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x. More... | |
| half2 | trunc (half2 x) |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x. More... | |
| half4 | trunc (half4 x) |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x. More... | |
| float | sigmoid (float x) |
The sigmoid function, i.e. 1/(1 + exp(-x)). More... | |
| float2 | sigmoid (float2 x) |
The sigmoid function, i.e. 1/(1 + exp(-x)). More... | |
| half | sigmoid (half x) |
The sigmoid function, i.e. 1/(1 + exp(-x)). More... | |
| half2 | sigmoid (half2 x) |
The sigmoid function, i.e. 1/(1 + exp(-x)). More... | |
| half4 | sigmoid (half4 x) |
The sigmoid function, i.e. 1/(1 + exp(-x)). More... | |
| float | atan2 (float x, float y) |
The arctangent of y/x, in radians. More... | |
| float2 | atan2 (float2 x, float2 y) |
The arctangent of y/x, in radians. More... | |
| half | atan2 (half x, half y) |
The arctangent of y/x, in radians. More... | |
| half2 | atan2 (half2 x, half2 y) |
The arctangent of y/x, in radians. More... | |
| half4 | atan2 (half4 x, half4 y) |
The arctangent of y/x, in radians. More... | |
| float | copysign (float x, float y) |
Composes a value of magnitude x with the sign of y. More... | |
| float2 | copysign (float2 x, float2 y) |
Composes a value of magnitude x with the sign of y. More... | |
| half | copysign (half x, half y) |
Composes a value of magnitude x with the sign of y. More... | |
| half2 | copysign (half2 x, half2 y) |
Composes a value of magnitude x with the sign of y. More... | |
| half4 | copysign (half4 x, half4 y) |
Composes a value of magnitude x with the sign of y. More... | |
| float | fdim (float x, float y) |
| Calculates the absolute difference between the two inputs. More... | |
| float2 | fdim (float2 x, float2 y) |
| Calculates the absolute difference between the two inputs. More... | |
| half | fdim (half x, half y) |
| Calculates the absolute difference between the two inputs. More... | |
| half2 | fdim (half2 x, half2 y) |
| Calculates the absolute difference between the two inputs. More... | |
| half4 | fdim (half4 x, half4 y) |
| Calculates the absolute difference between the two inputs. More... | |
| float | fmax (float x, float y) |
| Calculates the maximum of the two inputs. More... | |
| float2 | fmax (float2 x, float2 y) |
| Calculates the maximum of the two inputs. More... | |
| half | fmax (half x, half y) |
| Calculates the maximum of the two inputs. More... | |
| half2 | fmax (half2 x, half2 y) |
| Calculates the maximum of the two inputs. More... | |
| half4 | fmax (half4 x, half4 y) |
| Calculates the maximum of the two inputs. More... | |
| float | fmin (float x, float y) |
| Calculates the minimum of the two inputs. More... | |
| float2 | fmin (float2 x, float2 y) |
| Calculates the minimum of the two inputs. More... | |
| half | fmin (half x, half y) |
| Calculates the minimum of the two inputs. More... | |
| half2 | fmin (half2 x, half2 y) |
| Calculates the minimum of the two inputs. More... | |
| half4 | fmin (half4 x, half4 y) |
| Calculates the minimum of the two inputs. More... | |
| float | fmod (float x, float y) |
Calculates the remainder of the division x / y rounded towards zero. More... | |
| float2 | fmod (float2 x, float2 y) |
Calculates the remainder of the division x / y rounded towards zero. More... | |
| half | fmod (half x, half y) |
Calculates the remainder of the division x / y rounded towards zero. More... | |
| half2 | fmod (half2 x, half2 y) |
Calculates the remainder of the division x / y rounded towards zero. More... | |
| half4 | fmod (half4 x, half4 y) |
Calculates the remainder of the division x / y rounded towards zero. More... | |
| float | hypot (float x, float y) |
| Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs. More... | |
| float2 | hypot (float2 x, float2 y) |
| Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs. More... | |
| half | hypot (half x, half y) |
| Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs. More... | |
| half2 | hypot (half2 x, half2 y) |
| Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs. More... | |
| half4 | hypot (half4 x, half4 y) |
| Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs. More... | |
| float | pow (float x, float y) |
Calculates x to the power of y. More... | |
| float2 | pow (float2 x, float2 y) |
Calculates x to the power of y. More... | |
| half | pow (half x, half y) |
Calculates x to the power of y. More... | |
| half2 | pow (half2 x, half2 y) |
Calculates x to the power of y. More... | |
| half4 | pow (half4 x, half4 y) |
Calculates x to the power of y. More... | |
| float | remainder (float x, float y) |
Calculates the remainder of the division x / y, rounded to the nearest integral value, with halfway cases rounded to the even number. More... | |
| float2 | remainder (float2 x, float2 y) |
Calculates the remainder of the division x / y, rounded to the nearest integral value, with halfway cases rounded to the even number. More... | |
| half | remainder (half x, half y) |
Calculates the remainder of the division x / y, rounded to the nearest integral value, with halfway cases rounded to the even number. More... | |
| half2 | remainder (half2 x, half2 y) |
Calculates the remainder of the division x / y, rounded to the nearest integral value, with halfway cases rounded to the even number. More... | |
| half4 | remainder (half4 x, half4 y) |
Calculates the remainder of the division x / y, rounded to the nearest integral value, with halfway cases rounded to the even number. More... | |
| float | fma (float x, float y, float z) |
Computes (x * y) + z. More... | |
| float2 | fma (float2 x, float2 y, float2 z) |
Computes (x * y) + z. More... | |
| half | fma (half x, half y, half z) |
Computes (x * y) + z. More... | |
| half2 | fma (half2 x, half2 y, half2 z) |
Computes (x * y) + z. More... | |
| half4 | fma (half4 x, half4 y, half4 z) |
Computes (x * y) + z. More... | |
| long long | llrint (float x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| longlong2 | llrint (float2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long long | llrint (half x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| longlong2 | llrint (half2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| longlong4 | llrint (half4 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long long | llround (float x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| longlong2 | llround (float2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long long | llround (half x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| longlong2 | llround (half2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| longlong4 | llround (half4 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long | lrint (float x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long2 | lrint (float2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long | lrint (half x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long2 | lrint (half2 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long4 | lrint (half4 x) |
| Rounds input to a nearby integral value, using the current rounding mode. More... | |
| long | lround (float x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long2 | lround (float2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long | lround (half x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long2 | lround (half2 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
| long4 | lround (half4 x) |
| Rounds input to nearest integral value, with halfway cases rounded away from zero. More... | |
IPU intrinsic functions.
|
inline |
Targets the f32absadd instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1.
|
inline |
Targets the f32v2absadd instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1.
|
inline |
Targets the f16v2absadd instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1.
|
inline |
Targets the f16v4absadd instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1.
|
inline |
Targets the f32absmax instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1.
|
inline |
Targets the f32v2absmax instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1.
|
inline |
Targets the f16v2absmax instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1.
|
inline |
Targets the f16v4absmax instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1.
|
inline |
The arccos function, the inverse of cosine.
| x | A value of type float. |
acos of x.
|
inline |
The arccos function, the inverse of cosine.
| x | A value of type float2. |
acos of x.
|
inline |
The arccos function, the inverse of cosine.
| x | A value of type half. |
acos of x.
|
inline |
The arccos function, the inverse of cosine.
| x | A value of type half2. |
acos of x.
|
inline |
The arccos function, the inverse of cosine.
| x | A value of type half4. |
acos of x.
|
inline |
The arccosh function, the inverse of the hyperbolic cosine.
| x | A value of type float. |
acosh of x.
|
inline |
The arccosh function, the inverse of the hyperbolic cosine.
| x | A value of type float2. |
acosh of x.
|
inline |
The arccosh function, the inverse of the hyperbolic cosine.
| x | A value of type half. |
acosh of x.
|
inline |
The arccosh function, the inverse of the hyperbolic cosine.
| x | A value of type half2. |
acosh of x.
|
inline |
The arccosh function, the inverse of the hyperbolic cosine.
| x | A value of type half4. |
acosh of x.
|
inline |
Targets the andc instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
and of src0 and the negated value of src1 of type float.
|
inline |
Targets the andc64 instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
and of src0 and the negated value of src1 of type float2.
|
inline |
Targets the andc instruction.
| src0 | A value of type int. |
| src1 | A value of type int, can be a 12-bit constant. |
and of src0 and the negated value of src1 of type int.
|
inline |
Targets the andc instruction.
| src0 | A value of type unsigned. |
| src1 | A value of type unsigned, can be a 12-bit constant. |
and of src0 and the negated value of src1 of type unsigned.
|
inline |
The arcsin function, the inverse of sine.
| x | A value of type float. |
asin of x.
|
inline |
The arcsin function, the inverse of sine.
| x | A value of type float2. |
asin of x.
|
inline |
The arcsin function, the inverse of sine.
| x | A value of type half. |
asin of x.
|
inline |
The arcsin function, the inverse of sine.
| x | A value of type half2. |
asin of x.
|
inline |
The arcsin function, the inverse of sine.
| x | A value of type half4. |
asin of x.
|
inline |
The arcsinh function, the inverse of the hyperbolic sine.
| x | A value of type float. |
asinh of x.
|
inline |
The arcsinh function, the inverse of the hyperbolic sine.
| x | A value of type float2. |
asinh of x.
|
inline |
The arcsinh function, the inverse of the hyperbolic sine.
| x | A value of type half. |
asinh of x.
|
inline |
The arcsinh function, the inverse of the hyperbolic sine.
| x | A value of type half2. |
asinh of x.
|
inline |
The arcsinh function, the inverse of the hyperbolic sine.
| x | A value of type half4. |
asinh of x.
|
inline |
The arctan function, the inverse of tangent.
| x | A value of type float. |
atan of x.
|
inline |
The arctan function, the inverse of tangent.
| x | A value of type float2. |
atan of x.
|
inline |
The arctan function, the inverse of tangent.
| x | A value of type half. |
atan of x.
|
inline |
The arctan function, the inverse of tangent.
| x | A value of type half2. |
atan of x.
|
inline |
The arctan function, the inverse of tangent.
| x | A value of type half4. |
atan of x.
|
inline |
The arctangent of ( y )/( x ), in radians.
| x | A value of type float. |
| y | A value of type float. |
atan2 of x and y.
|
inline |
The arctangent of ( y )/( x ), in radians.
| x | A value of type float2. |
| y | A value of type float2. |
atan2 of x and y.
|
inline |
The arctangent of ( y )/( x ), in radians.
| x | A value of type half. |
| y | A value of type half. |
atan2 of x and y.
|
inline |
The arctangent of ( y )/( x ), in radians.
| x | A value of type half2. |
| y | A value of type half2. |
atan2 of x and y.
|
inline |
The arctangent of ( y )/( x ), in radians.
| x | A value of type half4. |
| y | A value of type half4. |
atan2 of x and y.
|
inline |
The arctanh function, the inverse of the hyperbolic tangent.
| x | A value of type float. |
atanh of x.
|
inline |
The arctanh function, the inverse of the hyperbolic tangent.
| x | A value of type float2. |
atanh of x.
|
inline |
The arctanh function, the inverse of the hyperbolic tangent.
| x | A value of type half. |
atanh of x.
|
inline |
The arctanh function, the inverse of the hyperbolic tangent.
| x | A value of type half2. |
atanh of x.
|
inline |
The arctanh function, the inverse of the hyperbolic tangent.
| x | A value of type half4. |
atanh of x.
|
inline |
Targets the f32v2axpy instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
res = a*src0 + src1. The scalar multiplicand a is provided by the internal state element $TAS.
|
inline |
Targets the bitrev8 instruction.
| src | A value of type int. |
int that is equivalent to the value of src with the bit order of each byte reversed.
|
inline |
The cubic root function.
| x | A value of type float. |
cbrt of x.
|
inline |
The cubic root function.
| x | A value of type float2. |
cbrt of x.
|
inline |
The cubic root function.
| x | A value of type half. |
cbrt of x.
|
inline |
The cubic root function.
| x | A value of type half2. |
cbrt of x.
|
inline |
The cubic root function.
| x | A value of type half4. |
cbrt of x.
|
inline |
Rounds up input to the closest integral value.
| x | A value of type float. |
x.
|
inline |
Rounds up input to the closest integral value.
| x | A value of type float2. |
x[i].
|
inline |
Rounds up input to the closest integral value.
| x | A value of type half. |
x.
|
inline |
Rounds up input to the closest integral value.
| x | A value of type half2. |
x[i].
|
inline |
Rounds up input to the closest integral value.
| x | A value of type half4. |
x[i].
|
inline |
Targets the f32clamp instruction.
| src0 | A value of type float. |
| src1 | A value of type float2. |
src0 and the two elements in src1.
|
inline |
Targets the f32v2clamp instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1, of type float2. The first element is the median of the first element of src0 and the two elements in src1. The second element is the median of the second element of src0 and the two elements in src1.
|
inline |
Targets the f16v2clamp instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1, of type half2. The first element is the median value of the first element of src0 and the two elements in src1. The second element is the median of the second element of src0 and the two elements in src1.
|
inline |
Targets the f16v4clamp instruction.
| src0 | A value of type half4. |
| src1 | A value of type half2. |
src0 and src1, of type half4. Each element is the median of the element in src0 at the same index, and the two values in src1.
|
inline |
Targets the clz instruction.
| src | A value of type int. |
src that are zero.
|
inline |
Targets the f16v2cmac instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
|
inline |
Targets the f16v4cmac instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
|
inline |
Targets the f32cmpeq instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 == src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmpeq instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] == src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmpeq instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] == src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmpeq instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] == src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32cmpge instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 >= src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmpge instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] >= src1[i] the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmpge instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] >= src1[i] the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmpge instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] >= src1[i] the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32cmpgt instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 > src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmpgt instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] > src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmpgt instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] > src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmpgt instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] > src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32cmple instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 <= src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmple instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] <= src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmple instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] <= src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmple instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] <= src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32cmplt instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 < src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmplt instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] < src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmplt instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] < src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmplt instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] < src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32cmpne instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1. If src0 != src1 the result will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f32v2cmpne instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1. If src0[i] != src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v2cmpne instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1. If src0[i] != src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the f16v4cmpne instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1. If src0[i] != src1[i], the result vector element at index i will be 0xffff, and 0x0000 otherwise.
|
inline |
Targets the cms instruction.
| src | A value of type int. |
src that match the sign bit (bit 31), as an unsigned.
|
inline |
Composes a value of magnitude x with the sign of y.
| x | A value of type float. |
| y | A value of type float. |
copysign of x and y.
|
inline |
Composes a value of magnitude x with the sign of y.
| x | A value of type float2. |
| y | A value of type float2. |
copysign of x and y.
|
inline |
Composes a value of magnitude x with the sign of y.
| x | A value of type half. |
| y | A value of type half. |
copysign of x and y.
|
inline |
Composes a value of magnitude x with the sign of y.
| x | A value of type half2. |
| y | A value of type half2. |
copysign of x and y.
|
inline |
Composes a value of magnitude x with the sign of y.
| x | A value of type half4. |
| y | A value of type half4. |
copysign of x and y.
|
inline |
The trigonometric cosine function.
| x | A value of type float. |
cos of x.
|
inline |
The trigonometric cosine function.
| x | A value of type float2. |
cos of x.
|
inline |
The trigonometric cosine function.
| x | A value of type half. |
cos of x.
|
inline |
The trigonometric cosine function.
| x | A value of type half2. |
cos of x.
|
inline |
The trigonometric cosine function.
| x | A value of type half4. |
cos of x.
|
inline |
The hyperbolic cosine function.
| x | A value of type float. |
cosh of x.
|
inline |
The hyperbolic cosine function.
| x | A value of type float2. |
cosh of x.
|
inline |
The hyperbolic cosine function.
| x | A value of type half. |
cosh of x.
|
inline |
The hyperbolic cosine function.
| x | A value of type half2. |
cosh of x.
|
inline |
The hyperbolic cosine function.
| x | A value of type half4. |
cosh of x.
|
inline |
The error function.
| x | A value of type float. |
x.
|
inline |
The error function.
| x | A value of type float2. |
x.
|
inline |
The error function.
| x | A value of type half. |
x.
|
inline |
The error function.
| x | A value of type half2. |
x.
|
inline |
The error function.
| x | A value of type half4. |
x.
|
inline |
The complementary error function.
| x | A value of type float. |
x.
|
inline |
The complementary error function.
| x | A value of type float2. |
x.
|
inline |
The complementary error function.
| x | A value of type half. |
x.
|
inline |
The complementary error function.
| x | A value of type half2. |
x.
|
inline |
The complementary error function.
| x | A value of type half4. |
x.
|
inline |
Targets the f32exp instruction.
The base-e exponential function.
| src | A value of type float. |
e^{src}.
| x | A value of type float. |
exp of x.
|
inline |
The base-e exponential function.
| x | A value of type float2. |
exp of x.
|
inline |
The base-e exponential function.
| x | A value of type half. |
exp of x.
|
inline |
Targets the f16v2exp instruction.
The base-e exponential function.
| src | A value of type half2. |
e^X of the two elements in src.
| x | A value of type half2. |
exp of x.
|
inline |
The base-e exponential function.
| x | A value of type half4. |
exp of x.
|
inline |
Targets the f32exp2 instruction.
The base-2 exponential function.
| src | A value of type float. |
2^{src}.
| x | A value of type float. |
exp2 of x.
|
inline |
The base-2 exponential function.
| x | A value of type float2. |
exp2 of x.
|
inline |
The base-2 exponential function.
| x | A value of type half. |
exp2 of x.
|
inline |
Targets the f16v2exp2 instruction.
The base-2 exponential function.
| src | A value of type half2. |
src.
| x | A value of type half2. |
exp2 of x.
|
inline |
The base-2 exponential function.
| x | A value of type half4. |
exp2 of x.
|
inline |
The base-e exponential function, minus one: exp(x) - 1.
| x | A value of type float. |
expm1 of x.
|
inline |
The base-e exponential function, minus one: exp(x) - 1.
| x | A value of type float2. |
expm1 of x.
|
inline |
The base-e exponential function, minus one: exp(x) - 1.
| x | A value of type half. |
expm1 of x.
|
inline |
The base-e exponential function, minus one: exp(x) - 1.
| x | A value of type half2. |
expm1 of x.
|
inline |
The base-e exponential function, minus one: exp(x) - 1.
| x | A value of type half4. |
expm1 of x.
|
inline |
Targets the f16v2grand instruction.
|
inline |
Targets the f32v2grand instruction.
|
inline |
Computes the absolute value of the input.
| x | A value of type float. |
x.
|
inline |
Computes the absolute value of the input.
| x | A value of type float2. |
x[i].
|
inline |
Computes the absolute value of the input.
| x | A value of type half. |
x.
|
inline |
Computes the absolute value of the input.
| x | A value of type half2. |
x[i].
|
inline |
Computes the absolute value of the input.
| x | A value of type half4. |
x[i].
|
inline |
Calculates the positive difference between the two inputs: x - y if x > y, and +0 otherwise.
| x | A value of type float. |
| y | A value of type float. |
fdim of x and y.
|
inline |
Calculates the positive difference between the two inputs: x - y if x > y, and +0 otherwise.
| x | A value of type float2. |
| y | A value of type float2. |
fdim of x and y.
|
inline |
Calculates the positive difference between the two inputs: x - y if x > y, and +0 otherwise.
| x | A value of type half. |
| y | A value of type half. |
fdim of x and y.
|
inline |
Calculates the positive difference between the two inputs: x - y if x > y, and +0 otherwise.
| x | A value of type half2. |
| y | A value of type half2. |
fdim of x and y.
|
inline |
Calculates the positive difference between the two inputs: x - y if x > y, and +0 otherwise.
| x | A value of type half4. |
| y | A value of type half4. |
fdim of x and y.
|
inline |
Rounds down input to the closest integral value.
| x | A value of type float. |
x.
|
inline |
Rounds down input to the closest integral value.
| x | A value of type float2. |
x[i].
|
inline |
Rounds down input to the closest integral value.
| x | A value of type half. |
x.
|
inline |
Rounds down input to the closest integral value.
| x | A value of type half2. |
x[i].
|
inline |
Rounds down input to the closest integral value.
| x | A value of type half4. |
x[i].
|
inline |
Computes ( x * y ) + z.
| x | A value of type float. |
| y | A value of type float. |
| z | A value of type float. |
( x * y ) + z.
|
inline |
Computes ( x * y ) + z.
| x | A value of type float2. |
| y | A value of type float2. |
| z | A value of type float2. |
( x[i] * y[i] ) + z[i].
|
inline |
Computes ( x * y ) + z.
| x | A value of type half. |
| y | A value of type half. |
| z | A value of type half. |
( x * y ) + z.
|
inline |
Computes ( x * y ) + z.
| x | A value of type half2. |
| y | A value of type half2. |
| z | A value of type half2. |
( x[i] * y[i] ) + z[i].
|
inline |
Computes ( x * y ) + z.
| x | A value of type half4. |
| y | A value of type half4. |
| z | A value of type half4. |
( x[i] * y[i] ) + z[i].
|
inline |
Calculates the maximum of the two inputs.
| x | A value of type float. |
| y | A value of type float. |
x and y. If one of them is a NaN, returns the other.
|
inline |
Calculates the maximum of the two inputs.
| x | A value of type float2. |
| y | A value of type float2. |
x[i] and y[i]. If either of them is a NaN, the other is set as the maximum.
|
inline |
Calculates the maximum of the two inputs.
| x | A value of type half. |
| y | A value of type half. |
x and y. If one of them is a NaN, returns the other.
|
inline |
Calculates the maximum of the two inputs.
| x | A value of type half2. |
| y | A value of type half2. |
x[i] and y[i]. If either of them is a NaN, the other is set as the maximum.
|
inline |
Calculates the maximum of the two inputs.
| x | A value of type half4. |
| y | A value of type half4. |
x[i] and y[i]. If either of them is a NaN, the other is set as the maximum.
|
inline |
Calculates the minimum of the two inputs.
| x | A value of type float. |
| y | A value of type float. |
x and y. If one of them is a NaN, returns the other.
|
inline |
Calculates the minimum of the two inputs.
| x | A value of type float2. |
| y | A value of type float2. |
x[i] and y[i]. If either of them is a NaN, the other is set as the minimum.
|
inline |
Calculates the minimum of the two inputs.
| x | A value of type half. |
| y | A value of type half. |
x and y. If one of them is a NaN, returns the other.
|
inline |
Calculates the minimum of the two inputs.
| x | A value of type half2. |
| y | A value of type half2. |
x[i] and y[i]. If either of them is a NaN, the other is set as the minimum.
|
inline |
Calculates the minimum of the two inputs.
| x | A value of type half4. |
| y | A value of type half4. |
x[i] and y[i]. If either of them is a NaN, the other is set as the minimum.
|
inline |
Calculates the remainder of the division x / y rounded towards zero.
| x | A value of type float. |
| y | A value of type float. |
fmod of x and y.
|
inline |
Calculates the remainder of the division x / y rounded towards zero.
| x | A value of type float2. |
| y | A value of type float2. |
fmod of x and y.
|
inline |
Calculates the remainder of the division x / y rounded towards zero.
| x | A value of type half. |
| y | A value of type half. |
fmod of x and y.
|
inline |
Calculates the remainder of the division x / y rounded towards zero.
| x | A value of type half2. |
| y | A value of type half2. |
fmod of x and y.
|
inline |
Calculates the remainder of the division x / y rounded towards zero.
| x | A value of type half4. |
| y | A value of type half4. |
fmod of x and y.
|
inline |
Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs.
| x | A value of type float. |
| y | A value of type float. |
hypot of x and y.
|
inline |
Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs.
| x | A value of type float2. |
| y | A value of type float2. |
hypot of x and y.
|
inline |
Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs.
| x | A value of type half. |
| y | A value of type half. |
hypot of x and y.
|
inline |
Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs.
| x | A value of type half2. |
| y | A value of type half2. |
hypot of x and y.
|
inline |
Calculates the hypotenuse of the right-angled triangle whose two shorter sides are of lengths given by the two inputs.
| x | A value of type half4. |
| y | A value of type half4. |
hypot of x and y.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float. |
x rounded to a nearby integral of type long long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float2. |
x[i] rounded to a nearby integral, of type long long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half. |
x rounded to a nearby integral of type long long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half2. |
x[i] rounded to a nearby integral, of type long long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half4. |
x[i] rounded to a nearby integral, of type long long.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float. |
x as a long long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float2. |
x[i] as a long long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half. |
x as a long long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half2. |
x[i] as a long long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half4. |
x[i] as a long long, with halfway cases rounded away from zero.
|
inline |
Targets the f32ln instruction.
| src | A value of type float. |
src.
|
inline |
Targets the f16v2ln instruction.
| src | A value of type half2. |
src.
|
inline |
Post-incrementing load, targeting the lds8step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a char.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a float.
|
inline |
Post-incrementing load, targeting the ld64step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a float2.
|
inline |
Post-incrementing load, targeting the ldb16step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a half.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a half2.
|
inline |
Post-incrementing load, targeting the ld64step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a half4.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as an int.
|
inline |
Post-incrementing load.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as an int2.
|
inline |
Post-incrementing load, targeting the lds16step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a short.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a short2.
|
inline |
Post-incrementing load.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a short4.
|
inline |
Post-incrementing load.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a uint2.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as an unsigned.
|
inline |
Post-incrementing load, targeting the ldz8step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as an unsigned char.
|
inline |
Post-incrementing load, targeting the ldz16step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as an unsigned short.
|
inline |
Post-incrementing load, targeting the ld32step instruction.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a ushort2.
|
inline |
Post-incrementing load.
| a | Address of the variable holding the address to load from. Gets incremented by i after the load. |
| i | Value by which to increment a after load. |
a, as a ushort4.
|
inline |
The natural logarithm.
| x | A value of type float. |
log of x.
|
inline |
The natural logarithm.
| x | A value of type float2. |
log of x.
|
inline |
The natural logarithm.
| x | A value of type half. |
log of x.
|
inline |
The natural logarithm.
| x | A value of type half2. |
log of x.
|
inline |
The natural logarithm.
| x | A value of type half4. |
log of x.
|
inline |
The base-10 logarithm.
| x | A value of type float. |
log10 of x.
|
inline |
The base-10 logarithm.
| x | A value of type float2. |
log10 of x.
|
inline |
The base-10 logarithm.
| x | A value of type half. |
log10 of x.
|
inline |
The base-10 logarithm.
| x | A value of type half2. |
log10 of x.
|
inline |
The base-10 logarithm.
| x | A value of type half4. |
log10 of x.
|
inline |
The natural logarithm of 1 + x.
| x | A value of type float. |
log1p of x.
|
inline |
The natural logarithm of 1 + x.
| x | A value of type float2. |
log1p of x.
|
inline |
The natural logarithm of 1 + x.
| x | A value of type half. |
log1p of x.
|
inline |
The natural logarithm of 1 + x.
| x | A value of type half2. |
log1p of x.
|
inline |
The natural logarithm of 1 + x.
| x | A value of type half4. |
log1p of x.
|
inline |
Targets the f32log2 instruction.
The base-2 logarithm.
| src | A value of type float. |
src.
| x | A value of type float. |
log2 of x.
|
inline |
The base-2 logarithm.
| x | A value of type float2. |
log2 of x.
|
inline |
The base-2 logarithm.
| x | A value of type half. |
log2 of x.
|
inline |
Targets the f16v2log2 instruction.
The base-2 logarithm.
| src | A value of type half2. |
src.
| x | A value of type half2. |
log2 of x.
|
inline |
The base-2 logarithm.
| x | A value of type half4. |
log2 of x.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float. |
x rounded to a nearby integral of type long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float2. |
x[i] rounded to a nearby integral, of type long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half. |
x rounded to a nearby integral of type long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half2. |
x[i] rounded to a nearby integral, of type long.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half4. |
x[i] rounded to a nearby integral, of type long.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float. |
x as a long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float2. |
x[i] as a long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half. |
x as a long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half2. |
x[i] as a long, with halfway cases rounded away from zero.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half4. |
x[i] as a long, with halfway cases rounded away from zero.
|
inline |
Targets the f32max instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1.
|
inline |
Targets the f32v2max instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1.
|
inline |
Targets the f16v2max instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1.
|
inline |
Targets the f16v4max instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1.
|
inline |
Targets the f16v4maxc instruction.
| src | A value of type half4. |
src. The 0th element in the result vector is the maximum of src[0] and src[1], and the 1st element is the maximum of src[2] and src[3].
|
inline |
Targets the f32min instruction.
| src0 | A value of type float. |
| src1 | A value of type float. |
src0 and src1.
|
inline |
Targets the f32v2min instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1.
|
inline |
Targets the f16v2min instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1.
|
inline |
Targets the f16v4min instruction.
| src0 | A value of type half4. |
| src1 | A value of type half4. |
src0 and src1.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float. |
x rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float2. |
x[i] rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half. |
x rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half2. |
x[i] rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half4. |
x[i] rounded to a nearby integral.
|
inline |
Targets the popc instruction.
| src | A value of type int. |
src.
|
inline |
Calculates x to the power of y.
| x | A value of type float. |
| y | A value of type float. |
x raised to the power of y, i.e. (x)^(y).
|
inline |
Calculates x to the power of y.
| x | A value of type float2. |
| y | A value of type float2. |
x[i] raised to the power of y[i].
|
inline |
Calculates x to the power of y.
| x | A value of type half. |
| y | A value of type half. |
x raised to the power of y, i.e. (x)^(y).
|
inline |
Calculates x to the power of y.
| x | A value of type half2. |
| y | A value of type half2. |
x[i] raised to the power of y[i].
|
inline |
Calculates x to the power of y.
| x | A value of type half4. |
| y | A value of type half4. |
x[i] raised to the power of y[i].
|
inline |
Calculates the remainder of the division x / y, where the quotient is rounded to the nearest integral value, with halfway cases rounded to the even number.
| x | A value of type float. |
| y | A value of type float. |
remainder of x and y.
|
inline |
Calculates the remainder of the division x / y, where the quotient is rounded to the nearest integral value, with halfway cases rounded to the even number.
| x | A value of type float2. |
| y | A value of type float2. |
remainder of x and y.
|
inline |
Calculates the remainder of the division x / y, where the quotient is rounded to the nearest integral value, with halfway cases rounded to the even number.
| x | A value of type half. |
| y | A value of type half. |
remainder of x and y.
|
inline |
Calculates the remainder of the division x / y, where the quotient is rounded to the nearest integral value, with halfway cases rounded to the even number.
| x | A value of type half2. |
| y | A value of type half2. |
remainder of x and y.
|
inline |
Calculates the remainder of the division x / y, where the quotient is rounded to the nearest integral value, with halfway cases rounded to the even number.
| x | A value of type half4. |
| y | A value of type half4. |
remainder of x and y.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float. |
x rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type float2. |
x[i] rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half. |
x rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half2. |
x[i] rounded to a nearby integral.
|
inline |
Rounds input to a nearby integral value, using the current rounding mode.
| x | A value of type half4. |
x[i] rounded to a nearby integral.
|
inline |
Targets the f32v2rmask instruction.
| src0 | A value of type float2. |
| src1 | A value of type float. |
src0, with each element of the input being individually masked with the probability specified by the bottom 17 bits of src1: if src1[16] == 1, no masking is applied; if src1[16:0] == 0, the result is a zero vector; otherwise, the probability of each element being left unmasked is src1[15:0] / 65536. The PRNG is used by this instruction to generate 2 x 16-bit random values from the discrete uniform distribution.
|
inline |
Targets the f16v4rmask instruction.
| src0 | A value of type half4. |
| src1 | A value of type float. |
src0, with each element of the input being individually masked with the probability specified by the bottom 17 bits of src1: if src1[16] == 1, no masking is applied; if src1[16:0] == 0, the result is a zero vector; otherwise, the probability of each element being left unmasked is src1[15:0] / 65536. The PRNG is used by this instruction to generate 4 x 16-bit random values from the discrete uniform distribution.
|
inline |
Targets the roll16 instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1, as a half2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 1 |
|
inline |
Targets the roll16 instruction.
| src0 | A value of type short2. |
| src1 | A value of type short2. |
src0 and src1, as a short2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 1 |
|
inline |
Targets the roll16 instruction.
| src0 | A value of type ushort2. |
| src1 | A value of type ushort2. |
src0 and src1, as a ushort2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 1 |
|
inline |
Targets the roll32 instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1, as a float2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 1 |
|
inline |
Targets the roll8l instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 6 | 5 | 4 | 3 |
|
inline |
Targets the roll8r instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 4 | 3 | 2 | 1 |
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float. |
round of x.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type float2. |
round of x.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half. |
round of x.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half2. |
round of x.
|
inline |
Rounds input to nearest integral value, with halfway cases rounded away from zero.
| x | A value of type half4. |
round of x.
|
inline |
The reciprocal square root function.
| x | A value of type float. |
x.
|
inline |
The reciprocal square root function.
| x | A value of type float2. |
x[i].
|
inline |
The reciprocal square root function.
| x | A value of type half. |
x.
|
inline |
The reciprocal square root function.
| x | A value of type half2. |
x[i].
|
inline |
The reciprocal square root function.
| x | A value of type half4. |
x[i].
|
inline |
Targets the shuf8x8hi instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 7 | 3 | 6 | 2 |
|
inline |
Targets the shuf8x8lo instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 5 | 1 | 4 | 0 |
|
inline |
Targets the f32sigm instruction.
| src | A value of type float. |
src.
|
inline |
Targets the f16v2sigm instruction.
| src | A value of type half2. |
src.
|
inline |
The sigmoid function, i.e. 1 / (1 + exp(-x)).
| x | A value of type float. |
sigmoid of x.
|
inline |
The sigmoid function, i.e. 1 / (1 + exp(-x)).
| x | A value of type float2. |
sigmoid of x.
|
inline |
The sigmoid function, i.e. 1 / (1 + exp(-x)).
| x | A value of type half. |
sigmoid of x.
|
inline |
The sigmoid function, i.e. 1 / (1 + exp(-x)).
| x | A value of type half2. |
sigmoid of x.
|
inline |
The sigmoid function, i.e. 1 / (1 + exp(-x)).
| x | A value of type half4. |
sigmoid of x.
|
inline |
The trigonometric sine function.
| x | A value of type float. |
sin of x.
|
inline |
The trigonometric sine function.
| x | A value of type float2. |
sin of x.
|
inline |
The trigonometric sine function.
| x | A value of type half. |
sin of x.
|
inline |
The trigonometric sine function.
| x | A value of type half2. |
sin of x.
|
inline |
The trigonometric sine function.
| x | A value of type half4. |
sin of x.
|
inline |
The hyperbolic sine function.
| x | A value of type float. |
sinh of x.
|
inline |
The hyperbolic sine function.
| x | A value of type float2. |
sinh of x.
|
inline |
The hyperbolic sine function.
| x | A value of type half. |
sinh of x.
|
inline |
The hyperbolic sine function.
| x | A value of type half2. |
sinh of x.
|
inline |
The hyperbolic sine function.
| x | A value of type half4. |
sinh of x.
|
inline |
Targets the sort4x16hi instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1, as a half2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 3 | 1 |
|
inline |
Targets the sort4x16hi instruction.
| src0 | A value of type short2. |
| src1 | A value of type short2. |
src0 and src1, as a short2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 3 | 1 |
|
inline |
Targets the sort4x16hi instruction.
| src0 | A value of type ushort2. |
| src1 | A value of type ushort2. |
src0 and src1, as a ushort2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 3 | 1 |
|
inline |
Targets the sort4x16lo instruction.
| src0 | A value of type half2. |
| src1 | A value of type half2. |
src0 and src1, as a half2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 0 |
|
inline |
Targets the sort4x16lo instruction.
| src0 | A value of type short2. |
| src1 | A value of type short2. |
src0 and src1, as a short2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 0 |
|
inline |
Targets the sort4x16lo instruction.
| src0 | A value of type ushort2. |
| src1 | A value of type ushort2. |
src0 and src1, as a ushort2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 0 |
|
inline |
Targets the sort4x32hi instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1, as a float2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 3 | 1 |
|
inline |
Targets the sort4x32lo instruction.
| src0 | A value of type float2. |
| src1 | A value of type float2. |
src0 and src1, as a float2. src0 = | 3 | 2 |, src1 = | 1 | 0 | -> Result = | 2 | 0 |
|
inline |
Targets the sort8 instruction.
| src | A value of type int. |
src, as an int. src = | 3 | 2 | 1 | 0 | -> Result = | 3 | 1 | 2 | 0 |
|
inline |
Targets the sort8x8hi instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 7 | 5 | 3 | 1 |
|
inline |
Targets the sort8x8lo instruction.
| src0 | A value of type int. |
| src1 | A value of type int. |
src0 and src1, as an int. src0 = | 7 | 6 | 5 | 4 |, src1 = | 3 | 2 | 1 | 0 | -> Result = | 6 | 4 | 2 | 0 |
|
inline |
The square root function.
| x | A value of type float. |
sqrt of x.
|
inline |
The square root function.
| x | A value of type float2. |
sqrt of x.
|
inline |
The square root function.
| x | A value of type half. |
sqrt of x.
|
inline |
The square root function.
| x | A value of type half2. |
sqrt of x.
|
inline |
The square root function.
| x | A value of type half4. |
sqrt of x.
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type char. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the st32step instruction.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type float. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the st64step instruction.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type float2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the st32step instruction.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type half2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the st64step instruction.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type half4. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type int. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type int2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type short. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type short2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type short4. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type uint2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type unsigned. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type unsigned char. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type unsigned short. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store, targeting the stm32step instruction if i is a variable stride, and st32step otherwise.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type ushort2. |
| i | Value by which to increment a after store. |
|
inline |
Post-incrementing store.
| a | Address of the variable holding the address to store to. Gets incremented by i after the store. |
| v | Value to store, of type ushort4. |
| i | Value by which to increment a after store. |
|
inline |
Targets the f16v2sum instruction.
| src | A value of type half2. |
src as a float.
|
inline |
Targets the f16v4sum instruction.
| src | A value of type half4. |
src as a float2. The first element is the sum of src[0] and src[1], the second element is the sum of src[2] and src[3].
|
inline |
Targets the swap8 instruction.
| src | A value of type int. |
src, as an int. src = | 3 | 2 | 1 | 0 | -> Result = | 2 | 3 | 0 | 1 |
|
inline |
The trigonometric tangent function.
| x | A value of type float. |
tan of x.
|
inline |
The trigonometric tangent function.
| x | A value of type float2. |
tan of x.
|
inline |
The trigonometric tangent function.
| x | A value of type half. |
tan of x.
|
inline |
The trigonometric tangent function.
| x | A value of type half2. |
tan of x.
|
inline |
The trigonometric tangent function.
| x | A value of type half4. |
tan of x.
|
inline |
Targets the f32tanh instruction.
The hyperbolic tangent function.
| src | A value of type float. |
| x | A value of type float. |
tanh of x.
|
inline |
The hyperbolic tangent function.
| x | A value of type float2. |
tanh of x.
|
inline |
The hyperbolic tangent function.
| x | A value of type half. |
tanh of x.
|
inline |
Targets the f16v2tanh instruction.
The hyperbolic tangent function.
| src | A value of type half2. |
| x | A value of type half2. |
tanh of x.
|
inline |
The hyperbolic tangent function.
| x | A value of type half4. |
tanh of x.
|
inline |
The gamma function.
| x | A value of type float. |
tgamma of x.
|
inline |
The gamma function.
| x | A value of type float2. |
tgamma of x.
|
inline |
The gamma function.
| x | A value of type half. |
tgamma of x.
|
inline |
The gamma function.
| x | A value of type half2. |
tgamma of x.
|
inline |
The gamma function.
| x | A value of type half4. |
tgamma of x.
|
inline |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x.
| x | A value of type float. |
x.
|
inline |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x.
| x | A value of type float2. |
x[i] that is not larger in magnitude.
|
inline |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x.
| x | A value of type half. |
x.
|
inline |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x.
| x | A value of type half2. |
x[i] that is not larger in magnitude.
|
inline |
Rounds input towards zero to the nearest integral value that is not larger in magnitude than x.
| x | A value of type half4. |
x[i] that is not larger in magnitude.