#include "NE10_types.h"
73 extern ne10_result_t (*
ne10_addc_float) (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
74 extern ne10_result_t ne10_addc_float_c (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
75 extern ne10_result_t ne10_addc_float_neon (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count)
asm (
"ne10_addc_float_neon");
76 extern ne10_result_t ne10_addc_float_asm (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
123 extern ne10_result_t (*
ne10_add_float) (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
124 extern ne10_result_t ne10_add_float_c (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
125 extern ne10_result_t ne10_add_float_neon (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count)
asm (
"ne10_add_float_neon");
126 extern ne10_result_t ne10_add_float_asm (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
189 extern ne10_result_t (*
ne10_addmat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
190 extern ne10_result_t ne10_addmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
191 extern ne10_result_t ne10_addmat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
192 extern ne10_result_t ne10_addmat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
201 extern ne10_result_t (*
ne10_addmat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
202 extern ne10_result_t ne10_addmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
203 extern ne10_result_t ne10_addmat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
204 extern ne10_result_t ne10_addmat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
213 extern ne10_result_t (*
ne10_addmat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
214 extern ne10_result_t ne10_addmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
215 extern ne10_result_t ne10_addmat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
216 extern ne10_result_t ne10_addmat_2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
244 extern ne10_result_t (*
ne10_subc_float) (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
245 extern ne10_result_t ne10_subc_float_c (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
246 extern ne10_result_t ne10_subc_float_neon (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
247 extern ne10_result_t ne10_subc_float_asm (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
293 extern ne10_result_t (*
ne10_sub_float) (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
294 extern ne10_result_t ne10_sub_float_c (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
295 extern ne10_result_t ne10_sub_float_neon (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count)
asm (
"ne10_sub_float_neon");
296 extern ne10_result_t ne10_sub_float_asm (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
358 extern ne10_result_t (*
ne10_rsbc_float) (ne10_float32_t * dst, ne10_float32_t *src,
const ne10_float32_t cst, ne10_uint32_t count);
359 extern ne10_result_t ne10_rsbc_float_c (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
360 extern ne10_result_t ne10_rsbc_float_neon (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
361 extern ne10_result_t ne10_rsbc_float_asm (ne10_float32_t * dst, ne10_float32_t *src,
const ne10_float32_t cst, ne10_uint32_t count);
423 extern ne10_result_t (*
ne10_submat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
424 extern ne10_result_t ne10_submat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
425 extern ne10_result_t ne10_submat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
426 extern ne10_result_t ne10_submat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
436 extern ne10_result_t (*
ne10_submat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
437 extern ne10_result_t ne10_submat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
438 extern ne10_result_t ne10_submat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
439 extern ne10_result_t ne10_submat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
449 extern ne10_result_t (*
ne10_submat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
450 extern ne10_result_t ne10_submat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
451 extern ne10_result_t ne10_submat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
452 extern ne10_result_t ne10_submat_2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
479 extern ne10_result_t (*
ne10_mulc_float) (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
480 extern ne10_result_t ne10_mulc_float_c (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
481 extern ne10_result_t ne10_mulc_float_neon (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
482 extern ne10_result_t ne10_mulc_float_asm (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
528 extern ne10_result_t (*
ne10_mul_float) (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
529 extern ne10_result_t ne10_mul_float_c (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
530 extern ne10_result_t ne10_mul_float_neon (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count)
asm (
"ne10_mul_float_neon");
531 extern ne10_result_t ne10_mul_float_asm (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
596 extern ne10_result_t (*
ne10_mlac_float) (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
597 extern ne10_result_t ne10_mlac_float_c (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
598 extern ne10_result_t ne10_mlac_float_neon (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
599 extern ne10_result_t ne10_mlac_float_asm (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
652 extern ne10_result_t (*
ne10_mla_float) (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
653 extern ne10_result_t ne10_mla_float_c (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
654 extern ne10_result_t ne10_mla_float_neon (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count)
asm (
"ne10_mla_float_neon");
655 extern ne10_result_t ne10_mla_float_asm (ne10_float32_t * dst, ne10_float32_t * acc, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
718 extern ne10_result_t (*
ne10_mulmat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
719 extern ne10_result_t ne10_mulmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
720 extern ne10_result_t ne10_mulmat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count)
asm (
"ne10_mulmat_4x4f_neon");
721 extern ne10_result_t ne10_mulmat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
731 extern ne10_result_t (*
ne10_mulmat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
732 extern ne10_result_t ne10_mulmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
733 extern ne10_result_t ne10_mulmat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count)
asm (
"ne10_mulmat_3x3f_neon");
734 extern ne10_result_t ne10_mulmat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
744 extern ne10_result_t (*
ne10_mulmat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
745 extern ne10_result_t ne10_mulmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
746 extern ne10_result_t ne10_mulmat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count)
asm (
"ne10_mulmat_2x2f_neon");
747 extern ne10_result_t ne10_mulmat_2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
774 extern ne10_result_t ne10_mulcmatvec_cm4x4f_v4f_c (
ne10_vec4f_t * dst,
const ne10_mat4x4f_t * cst,
ne10_vec4f_t * src, ne10_uint32_t count);
775 extern ne10_result_t ne10_mulcmatvec_cm4x4f_v4f_neon (
ne10_vec4f_t * dst,
const ne10_mat4x4f_t * cst,
ne10_vec4f_t * src, ne10_uint32_t count)
asm (
"ne10_mulcmatvec_cm4x4f_v4f_neon");
776 extern ne10_result_t ne10_mulcmatvec_cm4x4f_v4f_asm (
ne10_vec4f_t * dst,
const ne10_mat4x4f_t * cst,
ne10_vec4f_t * src, ne10_uint32_t count);
786 extern ne10_result_t ne10_mulcmatvec_cm3x3f_v3f_c (
ne10_vec3f_t * dst,
const ne10_mat3x3f_t * cst,
ne10_vec3f_t * src, ne10_uint32_t count);
787 extern ne10_result_t ne10_mulcmatvec_cm3x3f_v3f_neon (
ne10_vec3f_t * dst,
const ne10_mat3x3f_t * cst,
ne10_vec3f_t * src, ne10_uint32_t count)
asm (
"ne10_mulcmatvec_cm3x3f_v3f_neon");
788 extern ne10_result_t ne10_mulcmatvec_cm3x3f_v3f_asm (
ne10_vec3f_t * dst,
const ne10_mat3x3f_t * cst,
ne10_vec3f_t * src, ne10_uint32_t count);
798 extern ne10_result_t ne10_mulcmatvec_cm2x2f_v2f_c (
ne10_vec2f_t * dst,
const ne10_mat2x2f_t * cst,
ne10_vec2f_t * src, ne10_uint32_t count);
799 extern ne10_result_t ne10_mulcmatvec_cm2x2f_v2f_neon (
ne10_vec2f_t * dst,
const ne10_mat2x2f_t * cst,
ne10_vec2f_t * src, ne10_uint32_t count)
asm (
"ne10_mulcmatvec_cm2x2f_v2f_neon");
800 extern ne10_result_t ne10_mulcmatvec_cm2x2f_v2f_asm (
ne10_vec2f_t * dst,
const ne10_mat2x2f_t * cst,
ne10_vec2f_t * src, ne10_uint32_t count);
828 extern ne10_result_t (*
ne10_divc_float) (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
829 extern ne10_result_t ne10_divc_float_c (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
830 extern ne10_result_t ne10_divc_float_neon (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
831 extern ne10_result_t ne10_divc_float_asm (ne10_float32_t * dst, ne10_float32_t * src,
const ne10_float32_t cst, ne10_uint32_t count);
876 extern ne10_result_t (*
ne10_div_float) (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
877 extern ne10_result_t ne10_div_float_c (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
878 extern ne10_result_t ne10_div_float_neon (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count)
asm (
"ne10_div_float_neon");
879 extern ne10_result_t ne10_div_float_asm (ne10_float32_t * dst, ne10_float32_t * src1, ne10_float32_t * src2, ne10_uint32_t count);
942 extern ne10_result_t (*
ne10_divmat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
943 extern ne10_result_t ne10_divmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
944 extern ne10_result_t ne10_divmat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count)
asm (
"ne10_divmat_4x4f_neon");
945 extern ne10_result_t ne10_divmat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count);
954 extern ne10_result_t (*
ne10_divmat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
955 extern ne10_result_t ne10_divmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
956 extern ne10_result_t ne10_divmat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count)
asm (
"ne10_divmat_3x3f_neon");
957 extern ne10_result_t ne10_divmat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count);
966 extern ne10_result_t (*
ne10_divmat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
967 extern ne10_result_t ne10_divmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
968 extern ne10_result_t ne10_divmat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count)
asm (
"ne10_divmat_2x2f_neon");
969 extern ne10_result_t ne10_divmat_2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count);
995 extern ne10_result_t (*
ne10_setc_float) (ne10_float32_t * dst,
const ne10_float32_t cst, ne10_uint32_t count);
996 extern ne10_result_t ne10_setc_float_c (ne10_float32_t * dst,
const ne10_float32_t cst, ne10_uint32_t count);
997 extern ne10_result_t ne10_setc_float_neon (ne10_float32_t * dst,
const ne10_float32_t cst, ne10_uint32_t count);
998 extern ne10_result_t ne10_setc_float_asm (ne10_float32_t * dst,
const ne10_float32_t cst, ne10_uint32_t count);
1057 extern ne10_result_t ne10_len_vec2f_c (ne10_float32_t * dst,
ne10_vec2f_t * src, ne10_uint32_t count);
1058 extern ne10_result_t ne10_len_vec2f_neon (ne10_float32_t * dst,
ne10_vec2f_t * src, ne10_uint32_t count)
asm (
"ne10_len_vec2f_neon");
1059 extern ne10_result_t ne10_len_vec2f_asm (ne10_float32_t * dst,
ne10_vec2f_t * src, ne10_uint32_t count);
1068 extern ne10_result_t ne10_len_vec3f_c (ne10_float32_t * dst,
ne10_vec3f_t * src, ne10_uint32_t count);
1069 extern ne10_result_t ne10_len_vec3f_neon (ne10_float32_t * dst,
ne10_vec3f_t * src, ne10_uint32_t count)
asm (
"ne10_len_vec3f_neon");
1070 extern ne10_result_t ne10_len_vec3f_asm (ne10_float32_t * dst,
ne10_vec3f_t * src, ne10_uint32_t count);
1079 extern ne10_result_t ne10_len_vec4f_c (ne10_float32_t * dst,
ne10_vec4f_t * src, ne10_uint32_t count);
1080 extern ne10_result_t ne10_len_vec4f_neon (ne10_float32_t * dst,
ne10_vec4f_t * src, ne10_uint32_t count)
asm (
"ne10_len_vec4f_neon");
1081 extern ne10_result_t ne10_len_vec4f_asm (ne10_float32_t * dst,
ne10_vec4f_t * src, ne10_uint32_t count);
1109 extern ne10_result_t ne10_normalize_vec2f_neon (
ne10_vec2f_t * dst,
ne10_vec2f_t * src, ne10_uint32_t count)
asm (
"ne10_normalize_vec2f_neon");
1120 extern ne10_result_t ne10_normalize_vec3f_neon (
ne10_vec3f_t * dst,
ne10_vec3f_t * src, ne10_uint32_t count)
asm (
"ne10_normalize_vec3f_neon");
1131 extern ne10_result_t ne10_normalize_vec4f_neon (
ne10_vec4f_t * dst,
ne10_vec4f_t * src, ne10_uint32_t count)
asm (
"ne10_normalize_vec4f_neon");
1159 extern ne10_result_t (*
ne10_abs_float) (ne10_float32_t * dst, ne10_float32_t * src, ne10_uint32_t count);
1160 extern ne10_result_t ne10_abs_float_c (ne10_float32_t * dst, ne10_float32_t * src, ne10_uint32_t count);
1161 extern ne10_result_t ne10_abs_float_neon (ne10_float32_t * dst, ne10_float32_t * src, ne10_uint32_t count)
asm (
"ne10_abs_float_neon");
1162 extern ne10_result_t ne10_abs_float_asm (ne10_float32_t * dst, ne10_float32_t * src, ne10_uint32_t count);
1172 extern ne10_result_t ne10_abs_vec2f_neon (
ne10_vec2f_t * dst,
ne10_vec2f_t * src, ne10_uint32_t count)
asm (
"ne10_abs_vec2f_neon");
1183 extern ne10_result_t ne10_abs_vec3f_neon (
ne10_vec3f_t * dst,
ne10_vec3f_t * src, ne10_uint32_t count)
asm (
"ne10_abs_vec3f_neon");
1194 extern ne10_result_t ne10_abs_vec4f_neon (
ne10_vec4f_t * dst,
ne10_vec4f_t * src, ne10_uint32_t count)
asm (
"ne10_abs_vec4f_neon");
1222 extern ne10_result_t ne10_dot_vec2f_c (ne10_float32_t * dst,
ne10_vec2f_t * src1,
ne10_vec2f_t * src2, ne10_uint32_t count);
1223 extern ne10_result_t ne10_dot_vec2f_neon (ne10_float32_t * dst,
ne10_vec2f_t * src1,
ne10_vec2f_t * src2, ne10_uint32_t count)
asm (
"ne10_dot_vec2f_neon");
1224 extern ne10_result_t ne10_dot_vec2f_asm (ne10_float32_t * dst,
ne10_vec2f_t * src1,
ne10_vec2f_t * src2, ne10_uint32_t count);
1234 extern ne10_result_t ne10_dot_vec3f_c (ne10_float32_t * dst,
ne10_vec3f_t * src1,
ne10_vec3f_t * src2, ne10_uint32_t count);
1235 extern ne10_result_t ne10_dot_vec3f_neon (ne10_float32_t * dst,
ne10_vec3f_t * src1,
ne10_vec3f_t * src2, ne10_uint32_t count)
asm (
"ne10_dot_vec3f_neon");
1236 extern ne10_result_t ne10_dot_vec3f_asm (ne10_float32_t * dst,
ne10_vec3f_t * src1,
ne10_vec3f_t * src2, ne10_uint32_t count);
1246 extern ne10_result_t ne10_dot_vec4f_c (ne10_float32_t * dst,
ne10_vec4f_t * src1,
ne10_vec4f_t * src2, ne10_uint32_t count);
1247 extern ne10_result_t ne10_dot_vec4f_neon (ne10_float32_t * dst,
ne10_vec4f_t * src1,
ne10_vec4f_t * src2, ne10_uint32_t count)
asm (
"ne10_dot_vec4f_neon");
1248 extern ne10_result_t ne10_dot_vec4f_asm (ne10_float32_t * dst,
ne10_vec4f_t * src1,
ne10_vec4f_t * src2, ne10_uint32_t count);
1305 extern ne10_result_t (*
ne10_detmat_4x4f) (ne10_float32_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1306 extern ne10_result_t ne10_detmat_4x4f_c (ne10_float32_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1307 extern ne10_result_t ne10_detmat_4x4f_neon (ne10_float32_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count)
asm (
"ne10_detmat_4x4f_neon");
1308 extern ne10_result_t ne10_detmat_4x4f_asm (ne10_float32_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1316 extern ne10_result_t (*
ne10_detmat_3x3f) (ne10_float32_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1317 extern ne10_result_t ne10_detmat_3x3f_c (ne10_float32_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1318 extern ne10_result_t ne10_detmat_3x3f_neon (ne10_float32_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count)
asm (
"ne10_detmat_3x3f_neon");
1319 extern ne10_result_t ne10_detmat_3x3f_asm (ne10_float32_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1327 extern ne10_result_t (*
ne10_detmat_2x2f) (ne10_float32_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1328 extern ne10_result_t ne10_detmat_2x2f_c (ne10_float32_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1329 extern ne10_result_t ne10_detmat_2x2f_neon (ne10_float32_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count)
asm (
"ne10_detmat_2x2f_neon");
1330 extern ne10_result_t ne10_detmat_2x2f_asm (ne10_float32_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1355 extern ne10_result_t (*
ne10_invmat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1356 extern ne10_result_t ne10_invmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1357 extern ne10_result_t ne10_invmat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count)
asm (
"ne10_invmat_4x4f_neon");
1358 extern ne10_result_t ne10_invmat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1366 extern ne10_result_t (*
ne10_invmat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1367 extern ne10_result_t ne10_invmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1368 extern ne10_result_t ne10_invmat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count)
asm (
"ne10_invmat_3x3f_neon");
1369 extern ne10_result_t ne10_invmat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1377 extern ne10_result_t (*
ne10_invmat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1378 extern ne10_result_t ne10_invmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1379 extern ne10_result_t ne10_invmat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count)
asm (
"ne10_invmat_2x2f_neon");
1380 extern ne10_result_t ne10_invmat_2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1405 extern ne10_result_t (*
ne10_transmat_4x4f) (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1406 extern ne10_result_t ne10_transmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1407 extern ne10_result_t ne10_transmat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count)
asm (
"ne10_transmat_4x4f_neon");
1408 extern ne10_result_t ne10_transmat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src, ne10_uint32_t count);
1416 extern ne10_result_t (*
ne10_transmat_3x3f) (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1417 extern ne10_result_t ne10_transmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1418 extern ne10_result_t ne10_transmat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count)
asm (
"ne10_transmat_3x3f_neon");
1419 extern ne10_result_t ne10_transmat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src, ne10_uint32_t count);
1427 extern ne10_result_t (*
ne10_transmat_2x2f) (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1428 extern ne10_result_t ne10_transmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1429 extern ne10_result_t ne10_transmat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count)
asm (
"ne10_transmat_2x2f_neon");
1430 extern ne10_result_t ne10_trans_mat2x2f_asm (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src, ne10_uint32_t count);
1455 extern ne10_result_t ne10_identitymat_4x4f_c (ne10_mat4x4f_t * dst, ne10_uint32_t count);
1456 extern ne10_result_t ne10_identitymat_4x4f_neon (ne10_mat4x4f_t * dst, ne10_uint32_t count)
asm (
"ne10_identitymat_4x4f_neon");
1457 extern ne10_result_t ne10_identitymat_4x4f_asm (ne10_mat4x4f_t * dst, ne10_uint32_t count);
1465 extern ne10_result_t ne10_identitymat_3x3f_c (ne10_mat3x3f_t * dst, ne10_uint32_t count);
1466 extern ne10_result_t ne10_identitymat_3x3f_neon (ne10_mat3x3f_t * dst, ne10_uint32_t count)
asm (
"ne10_identitymat_3x3f_neon");
1467 extern ne10_result_t ne10_identitymat_3x3f_asm (ne10_mat3x3f_t * dst, ne10_uint32_t count);
1475 extern ne10_result_t ne10_identitymat_2x2f_c (ne10_mat2x2f_t * dst, ne10_uint32_t count);
1476 extern ne10_result_t ne10_identitymat_2x2f_neon (ne10_mat2x2f_t * dst, ne10_uint32_t count)
asm (
"ne10_identitymat_2x2f_neon");
1477 extern ne10_result_t ne10_identity_mat2x2f_asm (ne10_mat2x2f_t * dst, ne10_uint32_t count);