Commit ba867e6
committed
expose trtllm-gen per-tensor sparse MLA kernels
Signed-off-by: Perkz Zheng <67892460+PerkzZheng@users.noreply.github.com>
1 parent b8e6c83 commit ba867e6
File tree
7 files changed
+566
-38
lines changed
- csrc
- flashinfer
- include/flashinfer/trtllm/fmha
- tests/attention
7 files changed
+566
-38
lines changed

| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
34 | 34 | | |
35 | 35 | | |
36 | 36 | | |
37 | | - | |
| 37 | + | |
38 | 38 | | |
39 | 39 | | |
40 | 40 | | |
| |||
64 | 64 | | |
65 | 65 | | |
66 | 66 | | |
| 67 | + | |
| 68 | + | |
| 69 | + | |
| 70 | + | |
| 71 | + | |
| 72 | + | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
67 | 78 | | |
68 | 79 | | |
69 | 80 | | |
70 | 81 | | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
71 | 86 | | |
72 | 87 | | |
73 | 88 | | |
| |||
336 | 351 | | |
337 | 352 | | |
338 | 353 | | |
339 | | - | |
| 354 | + | |
340 | 355 | | |
341 | 356 | | |
342 | 357 | | |
| |||
346 | 361 | | |
347 | 362 | | |
348 | 363 | | |
349 | | - | |
350 | | - | |
| 364 | + | |
| 365 | + | |
351 | 366 | | |
352 | 367 | | |
353 | 368 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
82 | 82 | | |
83 | 83 | | |
84 | 84 | | |
85 | | - | |
86 | | - | |
| 85 | + | |
| 86 | + | |
87 | 87 | | |
88 | 88 | | |
89 | 89 | | |
| |||
139 | 139 | | |
140 | 140 | | |
141 | 141 | | |
| 142 | + | |
| 143 | + | |
| 144 | + | |
| 145 | + | |
| 146 | + | |
| 147 | + | |
142 | 148 | | |
143 | 149 | | |
144 | 150 | | |
| |||
201 | 207 | | |
202 | 208 | | |
203 | 209 | | |
204 | | - | |
205 | | - | |
206 | | - | |
207 | | - | |
208 | | - | |
209 | | - | |
210 | | - | |
211 | | - | |
212 | | - | |
| 210 | + | |
| 211 | + | |
| 212 | + | |
| 213 | + | |
| 214 | + | |
| 215 | + | |
| 216 | + | |
213 | 217 | | |
214 | 218 | | |
215 | 219 | | |
| |||
287 | 291 | | |
288 | 292 | | |
289 | 293 | | |
290 | | - | |
291 | | - | |
| 294 | + | |
| 295 | + | |
292 | 296 | | |
293 | 297 | | |
294 | 298 | | |
| |||
367 | 371 | | |
368 | 372 | | |
369 | 373 | | |
370 | | - | |
371 | | - | |
| 374 | + | |
| 375 | + | |
372 | 376 | | |
373 | 377 | | |
374 | 378 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
1922 | 1922 | | |
1923 | 1923 | | |
1924 | 1924 | | |
| 1925 | + | |
1925 | 1926 | | |
1926 | 1927 | | |
1927 | 1928 | | |
| |||
2328 | 2329 | | |
2329 | 2330 | | |
2330 | 2331 | | |
| 2332 | + | |
2331 | 2333 | | |
2332 | 2334 | | |
2333 | 2335 | | |
| |||
2500 | 2502 | | |
2501 | 2503 | | |
2502 | 2504 | | |
| 2505 | + | |
2503 | 2506 | | |
2504 | 2507 | | |
2505 | 2508 | | |
| |||
2524 | 2527 | | |
2525 | 2528 | | |
2526 | 2529 | | |
2527 | | - | |
2528 | | - | |
2529 | | - | |
2530 | | - | |
2531 | | - | |
2532 | | - | |
2533 | | - | |
2534 | | - | |
2535 | | - | |
2536 | | - | |
| 2530 | + | |
| 2531 | + | |
| 2532 | + | |
| 2533 | + | |
| 2534 | + | |
| 2535 | + | |
| 2536 | + | |
| 2537 | + | |
| 2538 | + | |
| 2539 | + | |
| 2540 | + | |
| 2541 | + | |
| 2542 | + | |
| 2543 | + | |
| 2544 | + | |
| 2545 | + | |
| 2546 | + | |
2537 | 2547 | | |
2538 | 2548 | | |
2539 | 2549 | | |
| |||
2547 | 2557 | | |
2548 | 2558 | | |
2549 | 2559 | | |
| 2560 | + | |
2550 | 2561 | | |
2551 | 2562 | | |
2552 | 2563 | | |
| |||
2562 | 2573 | | |
2563 | 2574 | | |
2564 | 2575 | | |
| 2576 | + | |
2565 | 2577 | | |
2566 | 2578 | | |
2567 | 2579 | | |
| |||
2654 | 2666 | | |
2655 | 2667 | | |
2656 | 2668 | | |
| 2669 | + | |
2657 | 2670 | | |
2658 | 2671 | | |
2659 | 2672 | | |
| |||
2687 | 2700 | | |
2688 | 2701 | | |
2689 | 2702 | | |
| 2703 | + | |
2690 | 2704 | | |
2691 | 2705 | | |
2692 | 2706 | | |
| |||
2768 | 2782 | | |
2769 | 2783 | | |
2770 | 2784 | | |
| 2785 | + | |
2771 | 2786 | | |
2772 | 2787 | | |
2773 | 2788 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
333 | 333 | | |
334 | 334 | | |
335 | 335 | | |
| 336 | + | |
| 337 | + | |
| 338 | + | |
| 339 | + | |
336 | 340 | | |
337 | 341 | | |
338 | 342 | | |
| |||
365 | 369 | | |
366 | 370 | | |
367 | 371 | | |
368 | | - | |
| 372 | + | |
| 373 | + | |
369 | 374 | | |
370 | 375 | | |
371 | 376 | | |
| |||
461 | 466 | | |
462 | 467 | | |
463 | 468 | | |
464 | | - | |
| 469 | + | |
| 470 | + | |
465 | 471 | | |
466 | 472 | | |
467 | 473 | | |
468 | 474 | | |
469 | 475 | | |
470 | | - | |
| 476 | + | |
| 477 | + | |
471 | 478 | | |
472 | 479 | | |
473 | 480 | | |
| |||
476 | 483 | | |
477 | 484 | | |
478 | 485 | | |
| 486 | + | |
| 487 | + | |
| 488 | + | |
| 489 | + | |
479 | 490 | | |
480 | 491 | | |
481 | 492 | | |
| |||
524 | 535 | | |
525 | 536 | | |
526 | 537 | | |
527 | | - | |
528 | | - | |
| 538 | + | |
| 539 | + | |
| 540 | + | |
| 541 | + | |
| 542 | + | |
| 543 | + | |
| 544 | + | |
| 545 | + | |
| 546 | + | |
| 547 | + | |
529 | 548 | | |
530 | 549 | | |
531 | 550 | | |
| |||
542 | 561 | | |
543 | 562 | | |
544 | 563 | | |
545 | | - | |
| 564 | + | |
| 565 | + | |
546 | 566 | | |
547 | 567 | | |
548 | 568 | | |
| |||
555 | 575 | | |
556 | 576 | | |
557 | 577 | | |
558 | | - | |
| 578 | + | |
559 | 579 | | |
560 | 580 | | |
561 | 581 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
287 | 287 | | |
288 | 288 | | |
289 | 289 | | |
| 290 | + | |
| 291 | + | |
| 292 | + | |
| 293 | + | |
290 | 294 | | |
291 | 295 | | |
292 | 296 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
486 | 486 | | |
487 | 487 | | |
488 | 488 | | |
489 | | - | |
490 | | - | |
| 489 | + | |
| 490 | + | |
491 | 491 | | |
492 | 492 | | |
493 | 493 | | |
| |||
597 | 597 | | |
598 | 598 | | |
599 | 599 | | |
| 600 | + | |
| 601 | + | |
| 602 | + | |
| 603 | + | |
| 604 | + | |
| 605 | + | |
| 606 | + | |
| 607 | + | |
| 608 | + | |
| 609 | + | |
600 | 610 | | |
601 | 611 | | |
602 | 612 | | |
| |||
720 | 730 | | |
721 | 731 | | |
722 | 732 | | |
| 733 | + | |
| 734 | + | |
| 735 | + | |
| 736 | + | |
| 737 | + | |
723 | 738 | | |
724 | 739 | | |
725 | 740 | | |
| |||
0 commit comments