[https://jirasw.nvidia.com/browse/TRTLLM-4645] support mutliCtasKvMode for high-throughput MLA kernels (#5426)

Signed-off-by: Perkz Zheng <67892460+PerkzZheng@users.noreply.github.com>
This commit is contained in:
Perkz Zheng 2025-06-25 16:31:10 +08:00 committed by GitHub
parent f3cfe86dd1
commit 1f292ff2a0
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2922 changed files with 7493 additions and 10077 deletions

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0a3b0b0d4aa1414c48c4cc39cc33855343b204bc4bc1dc65ea545e934f9659cd
size 1340171

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7dcefb2233db742e41ef20641e5a82dbace28be552a59a3dd29da7c2cd627f9a
size 1209973

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2ad04f87a1bdf10813d04b4369e6a6a534cbc49d798e95decde3450db928688c
size 1336765

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3f10b97c08a567ebd5525aed3e4074cf2523c8386e315e62703ab6be1cbc94f5
size 1243073

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cabf85db75d3629d804dd2433195797206c74424d822c6e6b27b4b44454044b5
size 1621995

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:802b694bf10314251d0ba5d011bfbfe876309966c4367fb84b7445aceda4355f
size 1491353

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:56d221da3f284bc3d67ffd76148b9ad553da5e901397681423d1050f22d55c6d
size 1457439

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0d13eae9e61ada7bb3d0b44c09270f300c768e107cdbf88d4a89fe0905702c01
size 1278991

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cde7cb08354f7a120436798e7b8c92cef87a795a77d78be0cb46cda936dbf017
size 1443131

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:edf9438819e6f1f345e139821db7ede22de23625901bafeb924c50d6173e5218
size 1265475

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1a366993a58705a9fba929f41c0523d2ada4a453caa99913e6ed0f7efd3f97b0
size 2079437

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:4cea7efd4f53a895e4c2ac0d7c4d7f083c7fb82ff9caf8b3ed69421606bfc45e
size 1361615

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c7f3221edcb2e0adbd12dde1fe347c12785b6e4535c8c6d574a75faf7baf4eaf
size 1259487

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c8faf3b8275e7ed6476dc5f6acc60a9a67339390447d7cc56b32da6f35741b8c
size 2065969

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:60a5c2f89f2957ffddf47913183e693354bc66a2a872199c41ba2105a48e3732
size 1347111

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:eaa45d201e6e116cd2c28e82fc31cc43f3bab5ffdf45a0a02e566ea58604b7b0
size 1245231

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c5e6bb3d4d79ea7a0a02c597ec8ce71e1cea03c54884036522dbf2becd2dd500
size 842129

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:efbebcf006a0ea80452e3afaef00878676cc9b1801d934563c7801966f39ca09
size 760579

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f07b920452d10d56220f00f0a3e3595ce0e9ebc576195f631eef23551de4fd0d
size 837467

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2d1ce1b5b4c55ec0c8339b7f7cdc76b54c27cfb27d24bdb51a039d0b712c8fe6
size 777575

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cb564b9fe672017e94d9b078daf76a991a9904eb62d250865494ddda5920ed81
size 1523099

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bdddbcad2b98d0e1fb73cf69a6fdb869611135b6caef9e067b046adb479ba0d0
size 1311205

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0e2fd02e1558936277192929c037dc58fa40426c83cd7780b816f3dd43ba7013
size 935815

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b1a23dc8b75c8e4b866b4e68d28ed86160d1fe6a10cd74cc9f2d38d111c3ea56
size 722095

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7c8d469df6957c2015ac904de69193ea1e702072ef8a453e95db6bc232a54f13
size 862553

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6d4b8866ffcab80634a9ae1234d279607751b7c3d7cd0dcafb5e39ce78050063
size 670935

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9586613c73e23e9c5a2ff4cdfea3ec716d42c40bb855d388c9a2622a6a022604
size 827821

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:18d71e3e3f63efa2be0f26fc20e92195991e59a7322a22ea4bff7080b2f3a22b
size 747061

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:53c0a9929caddb24462cdaf70f5bb6d1d5da7db76a0412e352066e476845b0cf
size 823161

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:62120a9cb7ec8e7150784127608eb2e4bdfd5611d1990a55e7709823441164f9
size 764057

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ea6cccecd27b216f4e91e4435852067afaf2e2529780c798e4eb5ccf9e83da49
size 1508941

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1fe5b16a2cc91187a724cf4b790f0a0311d679e26c56174ae19b16300deed44c
size 1297737

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c305b0bb0ad120c12ded43b4b589e704aa3200cbf20c33142a5ad23c5f593fb5
size 922199

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:852d2010d2203212db9cc170bf740024b304df29e9cfd3e7821737f753681a9e
size 708579

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9330bad32fc42b2bceae16048608768596092bad1c66d8984b70475dc5f22290
size 848297

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6594182f0e0adb4d7091327d513755646c44be9c8f0b62b5e97b4340792ed446
size 656677

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2546252b8f6540828813d44c9fca44d6e8384a2ed66da968d9739ec2b75ac55b
size 1739263

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9c9dfaa100085af6cd96c498bfbaf7b179e6cd40b927201ec1e2efb3455a9306
size 1560667

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5d6dd8c662b042e64df06f447e874dfa588a629ba64c2e088f3a3b80f8992513
size 962193

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1ef7e88e94fb9c9ed33b54a7895d63c340e13580aaf47f6fb4e3b49294ae463c
size 743985

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a483de6bc0e0cb4c2b949dc0f2dede69694f90f95795dab4459bb824b85e10cf
size 888537

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:879075df65c0856b0254372d1e20bc206ece4c2c87a59c640b5bf9ae4adc4f2d
size 689765

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:93f71d615cdc26146445b63a570892493a1a49b1a736057fbe76d18f68d34fc6
size 1724955

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:68fdafcf62ef67b510965164507b465e3162ed405a6f07748a465f9ecf20e322
size 1547151

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6ab78b1c07f6e4dbe30755d495ba9498176a62a7104d3f2d670376e5e2aa3d67
size 948577

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2b7b1044ac5a3b5d298ff819dafb3231be6b7729124ff33383398d0e2c4290aa
size 729777

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c7acf3b5a8b620022f8068b849c85a9c3ace0ee89cd7a98e44e209b41869df3a
size 874231

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:520cfa9758ae13d6b2174f63ce243a6f694500c45bfa75ead03e2c37c725557d
size 675459

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:aa4d0b53e3bbece2829484770be396603a7e03cfe4a784037027053b8691fc9d
size 1353689

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:15283dc59c477b94bb315ba92f634864e50a46bff78c910750bd70439ffc3bf7
size 1233553

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d562f7b44c7113b397d9980ec9b9b6f5d7fd768603d696a9861686853f32b703
size 1349395

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ea1871afbe89cf566dcd7c84261f9e9c3dbb3fe87254da0ec6494f045190e746
size 1302569

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ade3537b6709070ed451c71e57f6e7199179af35b2e091982d9af82de2c37369
size 1569919

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6c7e71ac8ab8d8db4c71b5559255d54428a87940995ac58ade9f46af2a5ccc21
size 1330151

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6d49eb5e5f9a26e50db96759118194f50831b6e8141c5dce11e5bddc5c28a5e0
size 1549149

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e97370786f5166a885387343fd35e71a531d5736e28736615b0a8d65b0dc0ee1
size 1308691

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:de65cb33211580f6107044e6ee390d5cfad17c1f811071ea8d798616b1ab2fac
size 1636369

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b4bf16bcaef1fdbfa5a4e3d873bbee35af8fdd372c1b8b88514e5d73c608ea87
size 1396009

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:71e60c99dd66797323fbb19ebc951eef6acfc8734333c45dfd6eee5df6b3b69f
size 1615649

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f59ec987f9b7b140fb1f14f8658094e8efd2b0ebb06a56635c207da528f789dd
size 1375437

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bc0caaf9e29b773e90236e0b2105e8ea6bf6227b73a8f58d5056182b4a890d45
size 1354481

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6b21669e6da3508dcd0d9666fa2bedcc65fb5aacf211246782778f56bbaa5ce1
size 1234347

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:82e12b495e381e6f86d691db40bd1594b4c0307cec2ec0f81437788bf6d9f6d0
size 1349399

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3a6281821b025119840644d399806ca03fada277f13827fc76ecb6fde8d1f228
size 1302573

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:420a2a1b009a357a777bd833c593f7d129db193412119ddbbb795df1b1068612
size 931001

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:4a0b8b94ac35e8fcd8c5e379ee62e3c1b27e41bde2dc3b2687c2787a58484c6c
size 826899

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c6e7395d3c9ec8063bee6d1720a085ca00aada14fd09b82a57a6fddeb6d721ac
size 931245

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:199baa2d592fddd4302f02fda25ec0244aa9abbe9d5a6a86dc474005f3daa2cf
size 880473

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:554b0d0be1eee57a424a778543c4a371c9a41bdf68e1ec0a8a3a03be17de39f3
size 1075777

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7bb67b7677bc62b856f54e0df91a30c63bedc9dfa5ec4b1fb5d4bdf7a94f059c
size 970837

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:fd519fec82eb9985748e924772a9e81c266dee0711aa4e7532b5927b509f3c4c
size 1037957

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:861e37785283353abba23aead6a6b0d4e2fd1af042de33cf62c0fb0da68078b1
size 915059

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5bf80d63bc6a97e62cf42b078339e9b84bd077bf144395b61a88d5b265a3f83d
size 1010183

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d5cac326a082ef431fc00f15648f75611e0cefc42a66d3e56227ace83c07824c
size 892811

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b87de96bb0d184b815b3dfa35f883fbb4c93c444f370af38e848a14d61fde559
size 994421

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e5ecd4069093bfc90bedab6fde83899785c6c7948217475d6b6a0c0e356f2945
size 933689

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bfafc749c1741d73a7b705cb76119faa12d6119f9dd3245d0d06132b984ac10b
size 987095

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5f778d73792656708d79c25e8018b28e83358a75b760a41a0bf03650a17c87ee
size 931741

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:76e08b737a378c747ec82628b0fa70d758fc7b0ce143934941502ec2cf11098d
size 1107121

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:432112568f53df28981f14176bec8ec9c83bfcc1a18bb20815af3d859c45ccf8
size 966265

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1e85bb54081cc755560460b2cde105781a8805d96944ecdbe72fc567b5929a6d
size 1140993

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f9379dcc020c943ba6ff2dd85b2b386516827f524886fcf573b7591de4c66409
size 887559

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:827d5a0e962ea2212ff04c760d880bcdd1f42a3dae69b27d390432a65d845e47
size 1086725

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:12d9e958aa4d413ce5abe403370ca3bcf6cbcc81ea89632e936271df9176e30a
size 833193

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e1abf913df86e7b2b65c848ef3f96e7e7b6670b3c89162a70f84ce57bb92c317
size 968225

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8a67d28cbf7ad3c673c806a0a538b2b5f1ea8de42649c692b91b352bc8bf4db1
size 907493

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bcdfde51a2faef784a72b504baee9e5fec315e9a6a5237919a6ae3641c55e5b0
size 960209

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:af4c5ec2d8bba7960c9c29e956dc04bf0c21f4615ab29d6438d9a1ac02dd0b95
size 905545

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7637d60fda4b169a2bd3d503e77c21cc58cff93a1f879f013d80cc2252e4d73b
size 1078457

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1fc1c1494d2d191407f902daf58d4d1b224d8f97fd38f92fa4c54d1697226da3
size 940859

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b267058f2b58b8ff638329d94fb20642d98b3a4b1977abd30882b56352ff34f6
size 1113267

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6afb05b7a599457e0ee89dff099974c2064216cfe008ede333e8b1704bf21800
size 861463

Some files were not shown because too many files have changed in this diff Show More