Commit 1b5cf348 authored by James Willis
Browse files

Fixed bugs in AVX-512 instructions.

parent a239328b
......@@ -116,10 +116,13 @@
for (int i = 0; i < VEC_SIZE; i++) b += a.f[i]; \
/* Calculates the number of set bits in the mask and adds the result to the
 * int `pack`. The v_mask argument is accepted but not used by the expansion.
 * NOTE(review): the expansion already ends in a semicolon, so a call site that
 * adds its own ';' produces an extra empty statement. */
#define VEC_FORM_PACKED_MASK(mask, v_mask, pack) \
pack += __builtin_popcount(mask);
/* Nothing needs to be computed in the case of AVX-512, as there are already
 * instructions for left-packing: the mask is copied into packed_mask
 * unchanged. The arguments and the whole expansion are parenthesised so the
 * macro behaves as a single assignment expression wherever it is used. */
#define VEC_FORM_PACKED_MASK(mask, packed_mask) ((packed_mask) = (mask))
/* Finds the horizontal maximum of the elements of vector a (read through its
 * .v member) and stores the result in b. The arguments and the whole
 * expansion are parenthesised so that expressions such as *ptr can be passed
 * for a and the macro can be used inside a larger expression. */
#define VEC_HMAX(a, b) ((b) = _mm512_reduce_max_ps((a).v))
/* Performs a left-pack on a vector based upon a mask and returns the result. */
#define VEC_LEFT_PACK(a, mask, result) \
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment