Skip to content

Commit dbcac52

Browse files
committed
add vectorcall
1 parent 044b254 commit dbcac52

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

src/board.c

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -293,7 +293,7 @@ bool board_lesser(const Board *b1, const Board *b2)
293293
* @param b the bitboard
294294
* @return a 128 bitboard mirrored
295295
*/
296-
static __m128i horizontal_mirror_mm(const __m128i b)
296+
static vectorcall __m128i horizontal_mirror_mm(const __m128i b)
297297
{
298298
const __m128i mask = _mm_set1_epi16(0x0F0F);
299299
const __m128i rev = _mm_set_epi8(H_MIRROR);
@@ -306,7 +306,7 @@ static __m128i horizontal_mirror_mm(const __m128i b)
306306
* @param b the bitboard
307307
* @return a 128 bitboard mirrored
308308
*/
309-
static __m128i vertical_mirror_mm(const __m128i b)
309+
static vectorcall __m128i vertical_mirror_mm(const __m128i b)
310310
{
311311
return _mm_shuffle_epi8(b, _mm_set_epi8(V_MIRROR));
312312
}
@@ -317,7 +317,7 @@ static __m128i vertical_mirror_mm(const __m128i b)
317317
* @param b the bitboard
318318
* @return a 128 bitboard transposed
319319
*/
320-
static __m128i transpose_mm(__m128i b)
320+
static vectorcall __m128i transpose_mm(__m128i b)
321321
{
322322
const __m128i mask00AA = _mm_set1_epi16(0x00AA);
323323
const __m128i maskCCCC = _mm_set1_epi32(0x0000CCCC);
@@ -342,7 +342,7 @@ static __m128i transpose_mm(__m128i b)
342342
* @param b input boards
343343
* @param sym output boards
344344
*/
345-
static void horizontal_mirror_avx2(const __m256i *b, __m256i *sym)
345+
static vectorcall void horizontal_mirror_avx2(const __m256i *b, __m256i *sym)
346346
{
347347
const __m256i mask = _mm256_set1_epi16(0x0F0F);
348348
const __m256i rev = _mm256_set_epi8(H_MIRROR, H_MIRROR);
@@ -356,7 +356,7 @@ static void horizontal_mirror_avx2(const __m256i *b, __m256i *sym)
356356
* @param b input boards
357357
* @param sym output boards
358358
*/
359-
static void vertical_mirror_avx2(const __m256i *b, __m256i *sym)
359+
static vectorcall void vertical_mirror_avx2(const __m256i *b, __m256i *sym)
360360
{
361361
const __m256i mask = _mm256_set_epi8( V_MIRROR, V_MIRROR);
362362
*sym = _mm256_shuffle_epi8(*b, mask);
@@ -1273,7 +1273,7 @@ uint64_t get_full_lines(const uint64_t disc, uint64_t full[4])
12731273
// too slow on zen3 cpu
12741274
#if 0 && USE_SIMD && defined(__AVX2__)
12751275

1276-
static uint64_t get_stable_by_contact(const uint64_t central_mask, const uint64_t previous_stable, const __m256i full)
1276+
static uint64_t vectorcall get_stable_by_contact(const uint64_t central_mask, const uint64_t previous_stable, const __m256i full)
12771277
{
12781278
__m128i stable, old_stable, central_mask_v2;
12791279
__m256i stable_v4;

0 commit comments

Comments
 (0)