Skip to content

Commit

Permalink
[Kernel] Add punica dimensions for Granite 3b and 8b (vllm-project#5930)
Browse files (browse the repository at this point in the history)
Signed-off-by: Joe Runde <joe@joerun.de>
  • Loading branch information
joerunde authored and prashantgupta24 committed Jul 1, 2024
1 parent a62d9e5 commit cc6f113
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 0 deletions.
2 changes: 2 additions & 0 deletions csrc/punica/bgmv/bgmv_config.h
Original file line number Diff line number Diff line change
@@ -86,6 +86,7 @@ void bgmv_kernel(out_T *__restrict__ Y, const in_T *__restrict__ X,
f(in_T, out_T, W_T, narrow, 36864) \
f(in_T, out_T, W_T, narrow, 43264) \
f(in_T, out_T, W_T, narrow, 49152) \
f(in_T, out_T, W_T, narrow, 49408) \
f(in_T, out_T, W_T, narrow, 60544) \
f(in_T, out_T, W_T, narrow, 60672) \
f(in_T, out_T, W_T, narrow, 64000) \
@@ -182,6 +183,7 @@ void bgmv_kernel(out_T *__restrict__ Y, const in_T *__restrict__ X,
f(in_T, out_T, W_T, 36864, narrow) \
f(in_T, out_T, W_T, 43264, narrow) \
f(in_T, out_T, W_T, 49152, narrow) \
f(in_T, out_T, W_T, 49408, narrow) \
f(in_T, out_T, W_T, 60544, narrow) \
f(in_T, out_T, W_T, 60672, narrow) \
f(in_T, out_T, W_T, 64000, narrow) \
Expand Down
1 change: 1 addition & 0 deletions tests/lora/test_punica.py
Original file line number Diff line number Diff line change
@@ -111,6 +111,7 @@ def _lora_ref_impl(
36864,
43264,
49152,
49408,
60544,
60672,
64000,
Expand Down

0 comments on commit cc6f113

Please sign in to comment.