[dpdk-dev,1/3] arm: rte_vect.h improvements
Commit Message
Added the definitions of rte_xmm and xmm_t for the ACL NEON implementation.
Removed the emulated _mm_* functions.
Signed-off-by: Jerin Jacob <jerin.jacob@caviumnetworks.com>
---
lib/librte_eal/common/include/arch/arm/rte_vect.h | 58 +++++++----------------
1 file changed, 17 insertions(+), 41 deletions(-)
@@ -1,7 +1,7 @@
/*-
* BSD LICENSE
*
- * Copyright(c) 2015 RehiveTech. All rights reserved.
+ * Copyright(c) 2015 Cavium Networks. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
@@ -13,7 +13,7 @@
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
- * * Neither the name of RehiveTech nor the names of its
+ * * Neither the name of Cavium Networks nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
@@ -33,49 +33,25 @@
#ifndef _RTE_VECT_ARM_H_
#define _RTE_VECT_ARM_H_
+#include "arm_neon.h"
+
#ifdef __cplusplus
extern "C" {
#endif
-#define XMM_SIZE 16
-#define XMM_MASK (XMM_MASK - 1)
-
-typedef struct {
- union uint128 {
- uint8_t uint8[16];
- uint32_t uint32[4];
- } val;
-} __m128i;
-
-static inline __m128i
-_mm_set_epi32(uint32_t v0, uint32_t v1, uint32_t v2, uint32_t v3)
-{
- __m128i res;
-
- res.val.uint32[0] = v0;
- res.val.uint32[1] = v1;
- res.val.uint32[2] = v2;
- res.val.uint32[3] = v3;
- return res;
-}
-
-static inline __m128i
-_mm_loadu_si128(__m128i *v)
-{
- __m128i res;
-
- res = *v;
- return res;
-}
-
-static inline __m128i
-_mm_load_si128(__m128i *v)
-{
- __m128i res;
-
- res = *v;
- return res;
-}
+typedef int32x4_t xmm_t;
+
+#define XMM_SIZE (sizeof(xmm_t))
+#define XMM_MASK (XMM_SIZE - 1)
+
+typedef union rte_xmm {
+ xmm_t x;
+ uint8_t u8[XMM_SIZE / sizeof(uint8_t)];
+ uint16_t u16[XMM_SIZE / sizeof(uint16_t)];
+ uint32_t u32[XMM_SIZE / sizeof(uint32_t)];
+ uint64_t u64[XMM_SIZE / sizeof(uint64_t)];
+ double pd[XMM_SIZE / sizeof(double)];
+} __attribute__((aligned(16))) rte_xmm_t;
#ifdef __cplusplus
}