Skip to content

Commit

Permalink
update block size for standalone_cint_v4
Browse files (browse the repository at this point in the history)
Differential Revision: D66350756
  • Loading branch information
zhaozhul authored and facebook-github-bot committed Nov 22, 2024
1 parent 55e346c commit ae4905f
Showing 1 changed file with 6 additions and 2 deletions.
8 changes: 6 additions & 2 deletions generative_recommenders/ops/triton/triton_jagged.py
Original file line number Diff line number Diff line change
Expand Up @@ -1166,6 +1166,8 @@ def _get_concat_2D_jagged_tritoncc_named_specs() -> List[VersionedSpec]:
(256, "*fp32"),
(512, "*bf16"),
(512, "*fp32"),
+ (1024, "*bf16"),
+ (1024, "*fp32"),
]
for offsets_b_type in ["*i64", "*i32"]
for IS_DENSE_A, IS_DENSE_B in [(False, False), (True, False), (False, True)]
Expand Down Expand Up @@ -1306,6 +1308,8 @@ def _get_concat_2D_jagged_tritoncc_named_specs() -> List[VersionedSpec]:
(256, "*fp32"),
(512, "*bf16"),
(512, "*fp32"),
+ (1024, "*bf16"),
+ (1024, "*fp32"),
]
for offsets_b_type in ["*i64", "*i32"]
for IS_DENSE_A, IS_DENSE_B in [(False, False), (True, False), (False, True)]
Expand Down Expand Up @@ -1502,7 +1506,7 @@ def _get_split_2D_jagged_tritoncc_named_specs() -> List[VersionedSpec]:
},
default_values=default_values,
)
- for BLOCK_D in [64, 128, 256, 512]
+ for BLOCK_D in [64, 128, 256, 512, 1024]
for dtype in ["*bf16", "*fp32"]
for offsets_a_type in ["*i64", "*i32"]
for offsets_b_type in ["*i64", "*i32"]
Expand Down Expand Up @@ -1556,7 +1560,7 @@ def _get_split_2D_jagged_tritoncc_named_specs() -> List[VersionedSpec]:
default_values=default_values,
version="standalone_cint_v4",
)
- for BLOCK_D in [64, 128, 256, 512]
+ for BLOCK_D in [64, 128, 256, 512, 1024]
for dtype in ["*bf16", "*fp32"]
for offsets_a_type in ["*i64", "*i32"]
for offsets_b_type in ["*i64", "*i32"]
Expand Down

0 comments on commit ae4905f

Please sign in to comment.