45#if defined(__SSE2__) || (defined(_MSC_VER) && !defined(_M_ARM64))
47#if defined(__AVX512VL__) || defined(__AVX10_1__)
59#if defined(__SSE4_1__) || (defined(_MSC_VER) && !defined(_M_ARM64))
60#if !defined(__AVX512VL__) && !defined(__AVX10_1__) && defined(__GNUC__) && \
61 __GNUC__ >= 5 && !defined(__clang__)
66#if defined(__AVX512VL__) || defined(__AVX10_1__)
68#elif defined(__clang__)
87#if (!defined(__GNUC__) || __GNUC__ >= 8) || defined(__clang__)
95#if (!defined(__GNUC__) || __GNUC__ >= 8) || defined(__clang__)
103#if defined(__AVX512VL__) || defined(__AVX10_1__)
114#if !defined(__AVX512VL__) && !defined(__AVX10_1__) && defined(__GNUC__) && \
115 __GNUC__ >= 5 && !defined(__clang__)
120#if defined(__AVX512VL__) || defined(__AVX10_1__)
122#elif defined(__clang__)
128 19342813113834066795298816.)));
140#if defined(__AVX512F__) || defined(__AVX10_512BIT__)
cudaStream_t stream[1]
CUDA streams for parallel computing on CPU and GPU.