@@ -200,6 +200,11 @@ namespace hardcodedzero{
200
200
__grid_constant__ const SequenceLengthT queryLength,
201
201
__grid_constant__ const PSSM_2D_View<ScoreType> strided_PSSM
202
202
) {
203
+ if constexpr (std::is_same_v<ScoreType, short2 >) {
204
+ #if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 900
205
+ return ;
206
+ #endif
207
+ }
203
208
static_assert (numRegs % 4 == 0 );
204
209
static_assert (blocksize % group_size == 0 );
205
210
__builtin_assume (blockDim .x == blocksize);
@@ -604,6 +609,11 @@ namespace hardcodedzero{
604
609
__grid_constant__ float2 * const multiTileTempStorage,
605
610
__grid_constant__ const size_t tempStorageElementsPerGroup
606
611
) {
612
+ if constexpr (std::is_same_v<ScoreType, short2 >) {
613
+ #if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 900
614
+ return ;
615
+ #endif
616
+ }
607
617
static_assert (numRegs % 4 == 0 );
608
618
static_assert (blocksize % group_size == 0 );
609
619
__builtin_assume (blockDim .x == blocksize);
@@ -1293,6 +1303,11 @@ namespace kernelparamzero{
1293
1303
__grid_constant__ const PSSM_2D_View<ScoreType> strided_PSSM,
1294
1304
__grid_constant__ const ScoreType zero
1295
1305
) {
1306
+ if constexpr (std::is_same_v<ScoreType, short2 >) {
1307
+ #if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 900
1308
+ return ;
1309
+ #endif
1310
+ }
1296
1311
static_assert (numRegs % 4 == 0 );
1297
1312
static_assert (blocksize % group_size == 0 );
1298
1313
__builtin_assume (blockDim .x == blocksize);
@@ -1677,6 +1692,11 @@ namespace kernelparamzero{
1677
1692
__grid_constant__ const size_t tempStorageElementsPerGroup,
1678
1693
__grid_constant__ const ScoreType zero
1679
1694
) {
1695
+ if constexpr (std::is_same_v<ScoreType, short2 >) {
1696
+ #if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 900
1697
+ return ;
1698
+ #endif
1699
+ }
1680
1700
static_assert (numRegs % 4 == 0 );
1681
1701
static_assert (blocksize % group_size == 0 );
1682
1702
__builtin_assume (blockDim .x == blocksize);
0 commit comments