|
| 1 | +#ifndef X86_SIMD_SORT_STATIC_METHODS |
| 2 | +#define X86_SIMD_SORT_STATIC_METHODS |
| 3 | +#include <vector> |
| 4 | +#include <stdlib.h> |
| 5 | +// Declare all methods: |
| 6 | +namespace x86simdsortStatic { |
| 7 | +template <typename T> |
| 8 | +X86_SIMD_SORT_FINLINE void qsort(T *arr, size_t size, bool hasnan = true); |
| 9 | + |
| 10 | +template <typename T> |
| 11 | +X86_SIMD_SORT_FINLINE void |
| 12 | +qselect(T *arr, size_t k, size_t size, bool hasnan = true); |
| 13 | + |
| 14 | +template <typename T> |
| 15 | +X86_SIMD_SORT_FINLINE void |
| 16 | +partial_qsort(T *arr, size_t k, size_t size, bool hasnan = true); |
| 17 | + |
| 18 | +template <typename T> |
| 19 | +X86_SIMD_SORT_FINLINE std::vector<size_t> |
| 20 | +argsort(T *arr, size_t size, bool hasnan = true); |
| 21 | + |
| 22 | +template <typename T> |
| 23 | +std::vector<size_t> X86_SIMD_SORT_FINLINE |
| 24 | +argselect(T *arr, size_t k, size_t size, bool hasnan = true); |
| 25 | + |
| 26 | +template <typename T1, typename T2> |
| 27 | +X86_SIMD_SORT_FINLINE void |
| 28 | +keyvalue_qsort(T1 *key, T2 *val, size_t size, bool hasnan = true); |
| 29 | +} // namespace x86simdsortStatic |
| 30 | + |
| 31 | +#define XSS_METHODS(ISA) \ |
| 32 | + template <typename T> \ |
| 33 | + X86_SIMD_SORT_FINLINE void x86simdsortStatic::qsort( \ |
| 34 | + T *arr, size_t size, bool hasnan) \ |
| 35 | + { \ |
| 36 | + ISA##_qsort(arr, size, hasnan); \ |
| 37 | + } \ |
| 38 | + template <typename T> \ |
| 39 | + X86_SIMD_SORT_FINLINE void x86simdsortStatic::qselect( \ |
| 40 | + T *arr, size_t k, size_t size, bool hasnan) \ |
| 41 | + { \ |
| 42 | + ISA##_qselect(arr, k, size, hasnan); \ |
| 43 | + } \ |
| 44 | + template <typename T> \ |
| 45 | + X86_SIMD_SORT_FINLINE void x86simdsortStatic::partial_qsort( \ |
| 46 | + T *arr, size_t k, size_t size, bool hasnan) \ |
| 47 | + { \ |
| 48 | + ISA##_partial_qsort(arr, k, size, hasnan); \ |
| 49 | + } \ |
| 50 | + template <typename T> \ |
| 51 | + X86_SIMD_SORT_FINLINE std::vector<size_t> x86simdsortStatic::argsort( \ |
| 52 | + T *arr, size_t size, bool hasnan) \ |
| 53 | + { \ |
| 54 | + return ISA##_argsort(arr, size, hasnan); \ |
| 55 | + } \ |
| 56 | + template <typename T> \ |
| 57 | + X86_SIMD_SORT_FINLINE std::vector<size_t> x86simdsortStatic::argselect( \ |
| 58 | + T *arr, size_t k, size_t size, bool hasnan) \ |
| 59 | + { \ |
| 60 | + return ISA##_argselect(arr, k, size, hasnan); \ |
| 61 | + } |
| 62 | + |
| 63 | +/* |
| 64 | + * qsort, qselect, partial, argsort key-value sort template functions. |
| 65 | + */ |
| 66 | +#include "xss-common-qsort.h" |
| 67 | +#include "xss-common-argsort.h" |
| 68 | + |
| 69 | +#if defined(__AVX512DQ__) && defined(__AVX512VL__) |
| 70 | +/* 32-bit and 64-bit dtypes vector definitions on SKX */ |
| 71 | +#include "avx512-32bit-qsort.hpp" |
| 72 | +#include "avx512-64bit-qsort.hpp" |
| 73 | +#include "avx512-64bit-argsort.hpp" |
| 74 | +#include "avx512-64bit-keyvaluesort.hpp" |
| 75 | + |
| 76 | +/* 16-bit dtypes vector definitions on ICL */ |
| 77 | +#if defined(__AVX512BW__) && defined(__AVX512VBMI2__) |
| 78 | +#include "avx512-16bit-qsort.hpp" |
| 79 | +/* _Float16 vector definition on SPR*/ |
| 80 | +#if defined(__FLT16_MAX__) && defined(__AVX512BW__) && defined(__AVX512FP16__) |
| 81 | +#include "avx512fp16-16bit-qsort.hpp" |
| 82 | +#endif // __FLT16_MAX__ |
| 83 | +#endif // __AVX512VBMI2__ |
| 84 | + |
| 85 | +XSS_METHODS(avx512) |
| 86 | + |
| 87 | +// key-value currently only on avx512 |
| 88 | +template <typename T1, typename T2> |
| 89 | +X86_SIMD_SORT_FINLINE void |
| 90 | +x86simdsortStatic::keyvalue_qsort(T1 *key, T2 *val, size_t size, bool hasnan) |
| 91 | +{ |
| 92 | + avx512_qsort_kv(key, val, size, hasnan); |
| 93 | +} |
| 94 | + |
| 95 | +#elif defined(__AVX2__) && !defined(__AVX512F__) |
| 96 | +/* 32-bit and 64-bit dtypes vector definitions on AVX2 */ |
| 97 | +#include "avx2-32bit-half.hpp" |
| 98 | +#include "avx2-32bit-qsort.hpp" |
| 99 | +#include "avx2-64bit-qsort.hpp" |
| 100 | +XSS_METHODS(avx2) |
| 101 | + |
| 102 | +#else |
| 103 | +#error "x86simdsortStatic methods needs to be compiled with avx512/avx2 specific flags" |
| 104 | +#endif // (__AVX512VL__ && __AVX512DQ__) || AVX2 |
| 105 | + |
| 106 | +#endif // X86_SIMD_SORT_STATIC_METHODS |
0 commit comments