Commit 934f093
committed
expose trtllm-gen per-tensor sparse MLA kernels
Signed-off-by: Perkz Zheng <67892460+PerkzZheng@users.noreply.github.com>1 parent 54eb341 commit 934f093
File tree
7 files changed
+562
-31
lines changed- csrc
- flashinfer
- include/flashinfer/trtllm/fmha
- tests/attention
7 files changed
+562
-31
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
34 | 34 | | |
35 | 35 | | |
36 | 36 | | |
37 | | - | |
| 37 | + | |
38 | 38 | | |
39 | 39 | | |
40 | 40 | | |
| |||
64 | 64 | | |
65 | 65 | | |
66 | 66 | | |
| 67 | + | |
| 68 | + | |
| 69 | + | |
| 70 | + | |
| 71 | + | |
| 72 | + | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
67 | 78 | | |
68 | 79 | | |
69 | 80 | | |
70 | 81 | | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
71 | 86 | | |
72 | 87 | | |
73 | 88 | | |
| |||
336 | 351 | | |
337 | 352 | | |
338 | 353 | | |
339 | | - | |
| 354 | + | |
340 | 355 | | |
341 | 356 | | |
342 | 357 | | |
| |||
346 | 361 | | |
347 | 362 | | |
348 | 363 | | |
349 | | - | |
350 | | - | |
| 364 | + | |
| 365 | + | |
351 | 366 | | |
352 | 367 | | |
353 | 368 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
79 | 79 | | |
80 | 80 | | |
81 | 81 | | |
82 | | - | |
83 | | - | |
| 82 | + | |
| 83 | + | |
84 | 84 | | |
85 | 85 | | |
86 | 86 | | |
| |||
132 | 132 | | |
133 | 133 | | |
134 | 134 | | |
| 135 | + | |
| 136 | + | |
| 137 | + | |
| 138 | + | |
| 139 | + | |
| 140 | + | |
135 | 141 | | |
136 | 142 | | |
137 | 143 | | |
| |||
199 | 205 | | |
200 | 206 | | |
201 | 207 | | |
202 | | - | |
203 | | - | |
204 | | - | |
| 208 | + | |
| 209 | + | |
| 210 | + | |
205 | 211 | | |
206 | 212 | | |
207 | 213 | | |
| |||
260 | 266 | | |
261 | 267 | | |
262 | 268 | | |
263 | | - | |
264 | | - | |
| 269 | + | |
| 270 | + | |
265 | 271 | | |
266 | 272 | | |
267 | 273 | | |
| |||
322 | 328 | | |
323 | 329 | | |
324 | 330 | | |
325 | | - | |
| 331 | + | |
326 | 332 | | |
327 | 333 | | |
328 | 334 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
1916 | 1916 | | |
1917 | 1917 | | |
1918 | 1918 | | |
| 1919 | + | |
1919 | 1920 | | |
1920 | 1921 | | |
1921 | 1922 | | |
| |||
2315 | 2316 | | |
2316 | 2317 | | |
2317 | 2318 | | |
| 2319 | + | |
2318 | 2320 | | |
2319 | 2321 | | |
2320 | 2322 | | |
| |||
2486 | 2488 | | |
2487 | 2489 | | |
2488 | 2490 | | |
| 2491 | + | |
2489 | 2492 | | |
2490 | 2493 | | |
2491 | 2494 | | |
| |||
2510 | 2513 | | |
2511 | 2514 | | |
2512 | 2515 | | |
2513 | | - | |
2514 | | - | |
2515 | | - | |
2516 | | - | |
2517 | | - | |
2518 | | - | |
2519 | | - | |
2520 | | - | |
2521 | | - | |
2522 | | - | |
| 2516 | + | |
| 2517 | + | |
| 2518 | + | |
| 2519 | + | |
| 2520 | + | |
| 2521 | + | |
| 2522 | + | |
| 2523 | + | |
| 2524 | + | |
| 2525 | + | |
| 2526 | + | |
| 2527 | + | |
| 2528 | + | |
| 2529 | + | |
| 2530 | + | |
| 2531 | + | |
| 2532 | + | |
2523 | 2533 | | |
2524 | 2534 | | |
2525 | 2535 | | |
| |||
2532 | 2542 | | |
2533 | 2543 | | |
2534 | 2544 | | |
| 2545 | + | |
2535 | 2546 | | |
2536 | 2547 | | |
2537 | 2548 | | |
| |||
2549 | 2560 | | |
2550 | 2561 | | |
2551 | 2562 | | |
| 2563 | + | |
2552 | 2564 | | |
2553 | 2565 | | |
2554 | 2566 | | |
| |||
2636 | 2648 | | |
2637 | 2649 | | |
2638 | 2650 | | |
| 2651 | + | |
2639 | 2652 | | |
2640 | 2653 | | |
2641 | 2654 | | |
| |||
2663 | 2676 | | |
2664 | 2677 | | |
2665 | 2678 | | |
| 2679 | + | |
2666 | 2680 | | |
2667 | 2681 | | |
2668 | 2682 | | |
| |||
2679 | 2693 | | |
2680 | 2694 | | |
2681 | 2695 | | |
| 2696 | + | |
2682 | 2697 | | |
2683 | 2698 | | |
2684 | 2699 | | |
| |||
2766 | 2781 | | |
2767 | 2782 | | |
2768 | 2783 | | |
| 2784 | + | |
2769 | 2785 | | |
2770 | 2786 | | |
2771 | 2787 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
333 | 333 | | |
334 | 334 | | |
335 | 335 | | |
| 336 | + | |
| 337 | + | |
| 338 | + | |
| 339 | + | |
336 | 340 | | |
337 | 341 | | |
338 | 342 | | |
| |||
365 | 369 | | |
366 | 370 | | |
367 | 371 | | |
368 | | - | |
| 372 | + | |
| 373 | + | |
369 | 374 | | |
370 | 375 | | |
371 | 376 | | |
| |||
461 | 466 | | |
462 | 467 | | |
463 | 468 | | |
464 | | - | |
| 469 | + | |
| 470 | + | |
465 | 471 | | |
466 | 472 | | |
467 | 473 | | |
468 | 474 | | |
469 | 475 | | |
470 | | - | |
| 476 | + | |
| 477 | + | |
471 | 478 | | |
472 | 479 | | |
473 | 480 | | |
| |||
476 | 483 | | |
477 | 484 | | |
478 | 485 | | |
| 486 | + | |
| 487 | + | |
| 488 | + | |
| 489 | + | |
479 | 490 | | |
480 | 491 | | |
481 | 492 | | |
| |||
524 | 535 | | |
525 | 536 | | |
526 | 537 | | |
527 | | - | |
528 | | - | |
| 538 | + | |
| 539 | + | |
| 540 | + | |
| 541 | + | |
| 542 | + | |
| 543 | + | |
| 544 | + | |
| 545 | + | |
| 546 | + | |
| 547 | + | |
529 | 548 | | |
530 | 549 | | |
531 | 550 | | |
| |||
542 | 561 | | |
543 | 562 | | |
544 | 563 | | |
545 | | - | |
| 564 | + | |
| 565 | + | |
546 | 566 | | |
547 | 567 | | |
548 | 568 | | |
| |||
555 | 575 | | |
556 | 576 | | |
557 | 577 | | |
558 | | - | |
| 578 | + | |
559 | 579 | | |
560 | 580 | | |
561 | 581 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
287 | 287 | | |
288 | 288 | | |
289 | 289 | | |
| 290 | + | |
| 291 | + | |
| 292 | + | |
| 293 | + | |
290 | 294 | | |
291 | 295 | | |
292 | 296 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
486 | 486 | | |
487 | 487 | | |
488 | 488 | | |
489 | | - | |
490 | | - | |
| 489 | + | |
| 490 | + | |
491 | 491 | | |
492 | 492 | | |
493 | 493 | | |
| |||
597 | 597 | | |
598 | 598 | | |
599 | 599 | | |
| 600 | + | |
| 601 | + | |
| 602 | + | |
| 603 | + | |
| 604 | + | |
| 605 | + | |
| 606 | + | |
| 607 | + | |
| 608 | + | |
| 609 | + | |
600 | 610 | | |
601 | 611 | | |
602 | 612 | | |
| |||
721 | 731 | | |
722 | 732 | | |
723 | 733 | | |
| 734 | + | |
| 735 | + | |
| 736 | + | |
| 737 | + | |
| 738 | + | |
724 | 739 | | |
725 | 740 | | |
726 | 741 | | |
| |||
0 commit comments