/* * Copyright (C) 2022 NHR@FAU, University Erlangen-Nuremberg. * All rights reserved. This file is part of MD-Bench. * Use of this source code is governed by a LGPL-3.0 * license that can be found in the LICENSE file. */ #include #include #include #include #ifndef NO_ZMM_INTRIN # include #endif #ifndef CLUSTER_M # define CLUSTER_M 1 #endif #ifndef CLUSTER_N # define CLUSTER_N 1 #endif #ifdef AVX512 # if PRECISION == 2 # include "simd/avx512_double.h" # else # include "simd/avx512_float.h" # endif #else # if PRECISION == 2 # include "simd/avx_avx2_double.h" # else # include "simd/avx_avx2_float.h" # endif #endif #define SIMD_PRINT_REAL(a) simd_print_real(#a, a); #define SIMD_PRINT_MASK(a) simd_print_mask(#a, a); static inline void simd_print_real(const char *ref, MD_SIMD_FLOAT a) { double x[VECTOR_WIDTH]; memcpy(x, &a, sizeof(x)); fprintf(stdout, "%s: ", ref); for(int i = 0; i < VECTOR_WIDTH; i++) { fprintf(stdout, "%f ", x[i]); } fprintf(stdout, "\n"); } static inline void simd_print_mask(const char *ref, MD_SIMD_MASK a) { fprintf(stdout, "%s: %x\n", ref, simd_mask_to_u32(a)); }