Merge remote-tracking branch 'origin/main' into feat/b300_cu13

Signed-off-by: Xiwen Yu <13230610+VALLIS-NERIA@users.noreply.github.com>
This commit is contained in:
Xiwen Yu 2025-09-10 07:46:25 +08:00
commit 5f508b7d43
2794 changed files with 5356 additions and 7498 deletions

1
.gitignore vendored
View File

@ -7,6 +7,7 @@ __pycache__/
*.npy
.VSCodeCounter
cpp/build*
cpp/Release
build
!tensorrt_llm/bench/build
!builders/

View File

@ -263,6 +263,7 @@ struct AdaBlockwiseGemmKernel
cute::clear(tAsA);
cute::clear(tBsB);
cute::clear(tAsSFA);
cute::clear(tBsSFB);
int k_tile_count = cute::size<2>(gA);
CUTLASS_PRAGMA_NO_UNROLL

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2965edaf6cc339fa943d7761c55f2b1ef670bb16359aaa9fd5ab6f7107bcb099
size 802287

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8e2f7f42b15d8e57c0916c95bdb1ea392d23864f9c7ed4a34f800ea0c7605b9b
size 715155

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bf63599cd1a80e9d8c8a1f0acf1f4e17a77cfd9a8f2d5387553c3f0a292042e9
size 804209

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:df223168d786a4aac8157a1ad45a49607d59979642af46721c9b726f4f8caea2
size 715005

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b4193e65378231a52150069dd334ced0e2ad28f26ea4aa240a38aefad0209694
size 869511

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bc32a5ef013f3d11cec5aaae7b7c3ac3785077527c7bf0882d0ad8861920ffe7
size 781787

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:278b07d4a0263b5099c9fd3b10653555fdb60fa525e2fb142bcb70e559b97ad3
size 859021

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:75066cdda0d5d29dbb3f2d67f32fdeecdf3536988b678200afd402e9149cb645
size 815157

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c54783ab08298a5c54c4655c4b2feae8cff627a68093d1f6b6b277becb738005
size 837661

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e8f051c4cbf5d10eb7ab75e0470f125440566c1eae81e3f0d48c9751113d6bb7
size 794041

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:13efb64efab5b77fb128fcecd4f4742fbd5aa24c6e05b2c643af81d6d5f25101
size 932265

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ae43c318177f77aa2c805ddc649fcb65156f842a90f944fc84b372417bb7a9d9
size 912031

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bdb66828906f1bb711aac3c7852da69bc17f2e04c1d980269bff8cd275132ea8
size 891249

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3bb119c52675eb06374f3641580147ff9d19292a58a8a5883b5aa54892749035
size 768647

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:53f4e690488da700dc4e1d0f5d7133953de8d26f22f6f9564458e228687ba863
size 907745

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cd83b513897c9e614c9f4532edc3032ef5ed1e6a6a6bf85aef3facc93602452a
size 890917

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:87e290474b855509bec65400f1497d22b2752db7f943fed646fa78c4c062112c
size 870479

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:35169252febd1930bec78f3612f021ab3b2a2c72fc6d16b306cf0aed4ef92e71
size 746941

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2f56763a3a99fbdc212394eaddf29acf64741061d749aaa140f8c51240df3331
size 760481

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cc0d08623a92ef6b30a1143e88ce3a68702dfaa5c2759b9675562361372c3cd6
size 693583

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c2644cfe62eec5b07dd00b7d9c45a7a1fece1cc4275020d86ad05729f0be6732
size 758503

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:736c138936e47814ebe158a5fede552c273c296eaaf7b24ec5eb3bf30deb929e
size 712621

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:48607a3f5eab809128ba8c499e417c49d3e0ce96b988076bdf3df599ee2cc310
size 933069

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:65b0e7a3477041166c985b37245268af6a93817213cb8acc473ae4d6753cb816
size 815747

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:fb3b9e408f9257507d629328a63ac612a5cba6b6e10ef4245d5821fd3b15b8ce
size 772401

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b52641a6f5bbe6b6edd2cb68c9131395ccb584f00e71dce8833db29beea95df6
size 645457

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ff3533ac50531779449af26d8f7e38779dae64d7801cee52cca845be1d1e43ab
size 732537

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a780e7277bab1bc72abfd50814b51bc945c9ba2f27c097ab1e8808d8ab6ac048
size 608652

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:29cbde30d12651659d467513fc336cfab0a3b0b1df4ac8740509237d33525f6f
size 733941

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7a3745618ddb4868e5d0aed1c50c7bc44dc35a908e431f1a3d7382bdc8790fbb
size 669263

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d2603e61d4b871143c4179b6421e4429003e3371940b87a0c05f7d4a459eb1c8
size 733491

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:447a4369e477d58d4c5a55fbbf34079ec81cd772fea907c4e0f13a112970decf
size 688397

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:4ab2e6119872b837377d731ba6bd79cf1dab366cdcd327f2f59db27c6ae87521
size 907859

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:28dd68f28334d802cb6024bcd774b67a8ed5c220888c6df8dc9728fff86090d0
size 795421

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e0975ff752916b455a4caab13cbc7c6e114d960550ff523cc51e8f4b2f64ae0d
size 744921

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:53568ff3ffec76cb2318374475e091d3cd6d13ea0f6471748a8d4895e08ace14
size 622961

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3a6d1547fa1b1c1c2cc05f7db31093ce1a6b9dcabfc0d5a42acdb537e560e525
size 705009

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d3c2cf6046e503089287ef03dff38c8c3da1e45090053941a3890b933c97bef9
size 586946

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:44ec5327cc5dcaf725ea96224fd3b5f0d859c55cb93e3041dff9595871e3d5d6
size 762045

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3bb6fa859bbda96f1d8d17911d26c7344b5354470e10423c7f2f243470db44f7
size 709059

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5fee8d3022d67993a8c8d35d2450a79b989619016e85d732e31e5b4062ac31ac
size 760509

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0beca5d6f9edd10678e63a469b1b3e611b484af8344916356000f04ccbb246e1
size 713739

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:287cffb13918406c88998a4cdf2c993d6b9104291afd64b64ed72412e5f40e3a
size 930143

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:952ed686eacad9c665244f2adc4c990b134577fd08a281f39174bae8016013e7
size 885587

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:17fb12053fe5b135ef481efc01246a426c305c554c20023122ec71dc96ba70d7
size 744857

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:69168f547e2d24a9563a496ce6ef5a0ed51968c375caf9b291411122b861d6c4
size 646331

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d687aa2ffae8970c8cf9203dae6f11abca9c9a046412f298fc7ddabc17aa9759
size 704205

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7cdfc83f8cee3d72b0606922796d759fcb3a847755f9ec3b081985029bf9292d
size 607700

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:02ce62644ca9fa62627a99d6bbd31d3155033d0fb07480a378e51f018e5c7fc0
size 735947

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:980a31504abb1bdf83356dbff08bedbaab7754524f58cf9bc54f066042a1c8d1
size 682961

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7f1718629724edd44b9f40c25d0ee2f7429536dddbfdd7332d1ec29b7aa60e17
size 737077

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8dd7faa7e726d7192abdbc5f2372caced4d2bbe3d25f0aaac4afcb3c9258177d
size 689517

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3efa010c342126d1720693ecd219820598da6494b1d61c00c49d4f8d69706898
size 909571

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:39a7c0a8feb3fa19cdec3230217e0a61fb44c8319d268c187b241fee894473fa
size 865261

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:50ef93f1de66f76d3500d328645c6e97f6d446ce78ceaf6b63e4f2200df84bc0
size 718957

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:be6390f8441a42cd10bd40e2645de18fdc6bb28b3ee76f7470c167583f3b14f2
size 619543

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:dcf45a6051c7d0f7e7a7ea0e89ff3634b7f9c5c26de34c055c916f1d03cd555d
size 678305

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2a78635e03f895eb255c3ad7d32726c0a70862c8e13f80118b105c125932794e
size 581800

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:36f9d3ab3565e73f13c1b92397b42cac3bb9aa96cba7dab1602bcfe542c940e2
size 726461

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:4b1c5f27dea83283f7fe75696d0cac728d2c35ed94350adf5c3ea7bca1e6415d
size 625961

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:882b2b0bf568bc5aebe2b5c00aaf03fff09db5e9740a9dbcee24a7fd7ff4b5a4
size 723499

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ae9ac6da80b2ca2f75515fc6ea4277d0fa985deb8d42901a526d807e794d393c
size 643373

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d8039f3c08de676a2ef0a8a8a789e072d6b77fc8e62fb04ea66befe6794726d5
size 793833

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7326a031a7c5e2d9360e968f63234246f640d39cdb855a8acb96bedfcd91f673
size 693629

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a5364e3514edc4fc6ebb6477e7fa485f6d31f2586846114cedd0ea74d9bc95fa
size 844025

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:07a27de9c373c7bd7fb94ad2b59f269d8848c291c79c0eb89b6476551d1a7091
size 781857

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e20332bea04c1c2827943b288711edaeac53ed734b79abb93375b4629377044e
size 794149

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:405b64f6b5ced2d9c30f4a86bc3bdc5e8c5201465d3d714ee27335c1180bc95a
size 738985

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:856e0f97a8857c02f5107b6a691c7eec5d009ffd62ab7d4226676915185c0fb8
size 935615

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9731feccf13bf37c39c75214d80818fa19c42a8076d5cee6644d1cc21a09280b
size 870937

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e9238fa8a3afd35ada586ddc8d1cea328d1c6c7c49bc20a713b7710f2019c08a
size 928703

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:389558a2d55a5f9413a6386703292526f911528c784817519a2bb2651662746c
size 890073

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:22331ad4f929f0badd2adf1af886322f5554692b2c7c055fa6c77f6231fb6998
size 909537

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c6bedc0179ff9579b1ed2a052fc1060443145a2f7a114bd2a3f5c3a5cc48156c
size 802969

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6d94f95ab619b20bbe52e63fb58cb7412221d0cf309bd841c993f54a3707930d
size 923705

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:adc22390588199d8327a41df9cb0e8c08cfcb493f76c7004320880168653593f
size 832185

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8fac98081b5ace5fbcc681d257ee4e75ee20755f50fa24dcd7a306f25f0ff1c2
size 878515

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5370d76e9d2f16e1dfcff8c02e2f26a26bb121d9d6fb139ad06acd53d9c33d3b
size 778507

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0f12026c102d1f5829eea7e7f8a492ffe0fb7c671944be92ca964fde71b9cde2
size 887317

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e55586934b9e9e46d0fc17e897475a28d33a8b82c26f1b1f16fe4de1fba6690b
size 824415

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:321330c0a03df99dc265fee7e5e3ca115727cd08a938f50952cfeb53e2d0c345
size 881145

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e53f7bd8cda39f0db32f30f9aee78488c386a1794035881bd2921df0459baa64
size 843255

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:dacc54c060adf3edca87d4a93c8d7d6ccea0ad62ebca94f7bbdad042dc45d53e
size 863065

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7488cb568a777e37fbaeec65157ffc42639145ed7e91d0ba599c952d4a233415
size 759605

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:48530588ddea30fc7f28646c852ea512ef1aac7d9189f82302b9f2bb079e8efb
size 873781

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5ba08f8146c255e2c5549a65d84b493b0c62b65def4266254bb12153fe9fc510
size 781273

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:acd59c13c0417c159f68329559aa21647074d0dd126a009cda56a7cd984ebb39
size 828589

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:fb47de952feeed9dbf15af8f8018c919a29f499cbac668c620d83311a2397906
size 730111

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:be0111de15798470a3177067bf92c3f5c6eb7f7cd6e960b75915cc74c13e2766
size 939053

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6103b066ae747c45cf1dbc3c13d613f273914bcef4237072980e9f914a7de7d9
size 891691

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2480a24795437746f6a2312d4fd48469a32dbe096587dc84a5cd9ac375d2e34d
size 932683

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:aac0e673afa7f4992a411383d48d61db010fcc8f131b24af08c93c773653a475
size 893115

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9c2a5fbdc69cf8598f23d5a549fa027b8f83228fc8a54abfb56b158e660d3f7f
size 911889

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e6549cd82faa228f65354021a08b35cff4d59cfa303184a5d12b3eef00978db2
size 848883

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:78fd2043ed0684cfb1e78438e575ec25a3d1d565db7068605a827a56c4227726
size 895373

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f6b2c4c13645f43178da8f78d7ee548f0bd6d9745247ee5fda241671be666c9b
size 787819

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1cf4126e5b125b413be2f5cb723de60f97f1f4d4a36efc25df6e935c38119038
size 848505

View File

@ -1,3 +0,0 @@
version https://git-lfs.github.com/spec/v1
oid sha256:50fe1a044be2962e0e7c555af8a14e84622ee272d394a273d43ce0376a9227d0
size 745981

Some files were not shown because too many files have changed in this diff Show More