/*
 * Scalar multiply-accumulate loop: for every index itr in [0, count),
 * stores acc[itr] + (src1[itr] * src2[itr]) into dst[itr].
 *
 * NOTE(review): this is a fragment of a generated source listing; the
 * leading numbers (40, 42) are listing line numbers, and the enclosing
 * function header is not part of this fragment. Presumably this is the
 * body of ne10_mla_float_c -- confirm against the original file.
 */
40 for (
unsigned int itr = 0; itr < count; itr++ )
42 dst[ itr ] = acc[ itr ] + (src1[ itr ] * src2[ itr ]);
/*
 * Two-component multiply-accumulate loop: for every index itr in
 * [0, count), computes acc + (src1 * src2) independently for the x and y
 * members and stores the results in the matching members of dst[itr].
 *
 * NOTE(review): the listing skips the lines between 50 and 52 and after 53
 * (likely the loop braces), so both assignments are assumed to sit inside
 * the loop body -- confirm against the original file. Presumably this is
 * the body of ne10_vmla_vec2f_c.
 */
50 for (
unsigned int itr = 0; itr < count; itr++ )
/* x component */
52 dst[ itr ].
x = acc[ itr ].
x + (src1[ itr ].
x * src2[ itr ].
x);
/* y component */
53 dst[ itr ].
y = acc[ itr ].
y + (src1[ itr ].
y * src2[ itr ].
y);
/*
 * Three-component multiply-accumulate loop: for every index itr in
 * [0, count), computes acc + (src1 * src2) independently for the x, y and
 * z members and stores the results in the matching members of dst[itr].
 *
 * NOTE(review): the listing skips the lines between 61 and 63 and after 65
 * (likely the loop braces), so all three assignments are assumed to sit
 * inside the loop body -- confirm against the original file. Presumably
 * this is the body of ne10_vmla_vec3f_c.
 */
61 for (
unsigned int itr = 0; itr < count; itr++ )
/* x component */
63 dst[ itr ].
x = acc[ itr ].
x + (src1[ itr ].
x * src2[ itr ].
x);
/* y component */
64 dst[ itr ].
y = acc[ itr ].
y + (src1[ itr ].
y * src2[ itr ].
y);
/* z component */
65 dst[ itr ].
z = acc[ itr ].
z + (src1[ itr ].
z * src2[ itr ].
z);
/*
 * Four-component multiply-accumulate loop: for every index itr in
 * [0, count), computes acc + (src1 * src2) independently for the x, y, z
 * and w members and stores the results in the matching members of
 * dst[itr].
 *
 * NOTE(review): the listing skips the lines between 73 and 75 and after 78
 * (likely the loop braces), so all four assignments are assumed to sit
 * inside the loop body -- confirm against the original file. Presumably
 * this is the body of ne10_vmla_vec4f_c.
 */
73 for (
unsigned int itr = 0; itr < count; itr++ )
/* x component */
75 dst[ itr ].
x = acc[ itr ].
x + (src1[ itr ].
x * src2[ itr ].
x);
/* y component */
76 dst[ itr ].
y = acc[ itr ].
y + (src1[ itr ].
y * src2[ itr ].
y);
/* z component */
77 dst[ itr ].
z = acc[ itr ].
z + (src1[ itr ].
z * src2[ itr ].
z);
/* w component */
78 dst[ itr ].
w = acc[ itr ].
w + (src1[ itr ].
w * src2[ itr ].
w);
ne10_result_t ne10_vmla_vec4f_c(ne10_vec4f_t *dst, ne10_vec4f_t *acc, ne10_vec4f_t *src1, ne10_vec4f_t *src2, ne10_uint32_t count)
Specific implementation of ne10_vmla_vec4f using plain C code.
ne10_vec2f_t: A 2-tuple of ne10_float32_t values.
ne10_result_t ne10_vmla_vec3f_c(ne10_vec3f_t *dst, ne10_vec3f_t *acc, ne10_vec3f_t *src1, ne10_vec3f_t *src2, ne10_uint32_t count)
Specific implementation of ne10_vmla_vec3f using plain C code.
ne10_result_t ne10_vmla_vec2f_c(ne10_vec2f_t *dst, ne10_vec2f_t *acc, ne10_vec2f_t *src1, ne10_vec2f_t *src2, ne10_uint32_t count)
Specific implementation of ne10_vmla_vec2f using plain C code.
ne10_vec3f_t: A 3-tuple of ne10_float32_t values.
#define NE10_CHECKPOINTER_DstSrc1Src2
ne10_vec4f_t: A 4-tuple of ne10_float32_t values.
ne10_result_t ne10_mla_float_c(ne10_float32_t *dst, ne10_float32_t *acc, ne10_float32_t *src1, ne10_float32_t *src2, ne10_uint32_t count)
Specific implementation of ne10_mla_float using plain C code.