Skip to content

Commit

Permalink
fix: fmha unrollList
Browse files (browse the repository at this point in the history)
  • Loading branch information
byshiue committed Dec 16, 2022
1 parent 18aaefc commit 83776ae
Showing 1 changed file with 0 additions and 21 deletions.
Original file line number | Diff line number | Diff line change
Expand Up @@ -5294,9 +5294,6 @@ class FusedMultiHeadAttentionXMMAKernelV2:
int mD;
int mMaxBatch;
} unrollList[] = {
{kSM_75, fastertransformer::DATA_TYPE_FP16, 64, 32, 1},
{kSM_75, fastertransformer::DATA_TYPE_FP16, 64, 40, 1},
{kSM_75, fastertransformer::DATA_TYPE_FP16, 64, 64, 1},
{kSM_75, fastertransformer::DATA_TYPE_FP16, 128, 32, 1},
{kSM_75, fastertransformer::DATA_TYPE_FP16, 128, 40, 1},
{kSM_75, fastertransformer::DATA_TYPE_FP16, 128, 64, 1},
Expand All @@ -5307,9 +5304,6 @@ class FusedMultiHeadAttentionXMMAKernelV2:
{kSM_75, fastertransformer::DATA_TYPE_INT8, 256, 64, 1},
{kSM_75, fastertransformer::DATA_TYPE_INT8, 384, 64, 1},
#if CUDA_VERSION >= 11000
{kSM_80, fastertransformer::DATA_TYPE_FP16, 64, 32, 4},
{kSM_80, fastertransformer::DATA_TYPE_FP16, 64, 40, 4},
{kSM_80, fastertransformer::DATA_TYPE_FP16, 64, 64, 4},
{kSM_80, fastertransformer::DATA_TYPE_FP16, 128, 32, 4},
{kSM_80, fastertransformer::DATA_TYPE_FP16, 128, 40, 4},
{kSM_80, fastertransformer::DATA_TYPE_FP16, 128, 64, 4},
Expand All @@ -5320,9 +5314,6 @@ class FusedMultiHeadAttentionXMMAKernelV2:
{kSM_80, fastertransformer::DATA_TYPE_INT8, 256, 64, 8},
{kSM_80, fastertransformer::DATA_TYPE_INT8, 384, 64, 8},

{kSM_86, fastertransformer::DATA_TYPE_FP16, 64, 32, 4},
{kSM_86, fastertransformer::DATA_TYPE_FP16, 64, 40, 4},
{kSM_86, fastertransformer::DATA_TYPE_FP16, 64, 64, 4},
{kSM_86, fastertransformer::DATA_TYPE_FP16, 128, 32, 4},
{kSM_86, fastertransformer::DATA_TYPE_FP16, 128, 40, 4},
{kSM_86, fastertransformer::DATA_TYPE_FP16, 128, 64, 4},
Expand All @@ -5331,18 +5322,6 @@ class FusedMultiHeadAttentionXMMAKernelV2:
{kSM_86, fastertransformer::DATA_TYPE_INT8, 192, 64, 16},
{kSM_86, fastertransformer::DATA_TYPE_INT8, 256, 64, 8},
{kSM_86, fastertransformer::DATA_TYPE_INT8, 384, 64, 8},

{kSM_89, fastertransformer::DATA_TYPE_FP16, 64, 32, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 64, 40, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 64, 64, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 128, 32, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 128, 40, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 128, 64, 4},
{kSM_89, fastertransformer::DATA_TYPE_FP16, 256, 64, 4},
{kSM_89, fastertransformer::DATA_TYPE_INT8, 128, 64, 4},
{kSM_89, fastertransformer::DATA_TYPE_INT8, 192, 64, 16},
{kSM_89, fastertransformer::DATA_TYPE_INT8, 256, 64, 8},
{kSM_89, fastertransformer::DATA_TYPE_INT8, 384, 64, 8},
#endif
};
for (unsigned int i = 0u; i < sizeof(unrollList) / sizeof(unrollList[0]); ++i) {
Expand Down

0 comments on commit 83776ae

Please sign in to comment.