Index of sw-kernelinferencelibrary-public-generic-local/d8c2e4e646bd7e73ea79f06ae52b4ba13adddc64/fmha/trtllm-gen
Name Last modified Size
../
include/ 21-Aug-2025 12:37 -
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 274.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 271.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 246.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 236.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 271.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 269.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 244.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 234.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 270.33 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 268.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 243.53 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 232.63 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 264.21 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 198.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 183.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 262.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 196.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 254.31 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 244.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 191.45 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 181.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 176.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.25 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 262.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 196.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 181.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 259.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 194.73 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.21 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 252.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 242.03 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 189.31 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 174.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 167.11 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 260.64 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 195.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.90 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 258.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 193.29 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 178.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 250.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 240.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 188.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 172.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.68 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 200.06 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 184.19 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 198.22 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 188.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.36 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 172.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 168.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 197.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 196.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.64 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 186.29 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 178.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 170.75 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 196.37 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 194.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.21 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 184.92 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 176.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 169.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 232.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 231.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 212.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 196.64 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 230.03 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 229.29 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 210.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 194.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 228.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 227.85 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 209.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 222.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 162.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 221.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.61 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 220.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 204.73 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 164.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 153.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.56 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 220.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.03 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 219.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 218.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 202.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 162.32 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.70 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 151.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 218.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 158.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 218.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 216.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 201.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 160.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 163.15 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.85 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 162.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 161.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.32 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 159.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.73 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 147.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.45 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 158.89 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.47 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 158.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.76 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 122.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 117.43 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 119.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 115.05 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 134.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 102.39 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 133.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.36 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 101.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 128.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 127.08 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 117.32 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 117.93 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 107.03 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.86 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 99.61 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 88.81 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 131.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.32 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.89 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 131.07 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 125.42 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 123.75 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 114.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 115.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 103.65 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 93.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 96.36 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 86.06 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 103.21 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 102.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 137.71 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 130.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 105.76 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.03 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 98.09 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 87.61 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 134.64 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 128.21 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 102.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 92.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 94.84 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 84.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 111.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 106.37 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 108.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 104.00 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 122.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 90.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 121.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.75 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 90.97 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 119.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 117.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 106.27 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 106.97 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 96.31 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 84.25 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 86.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 77.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 120.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 87.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 118.72 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 93.37 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 88.34 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 116.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 114.43 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 103.89 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 104.47 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 93.06 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 81.87 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 83.61 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 74.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.64 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 90.72 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.68 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 91.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 127.82 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 119.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 95.04 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 83.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 86.99 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 75.99 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.14 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 88.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 89.03 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 124.48 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 116.78 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 91.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 80.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 83.99 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 73.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 253.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 252.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 224.68 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 215.23 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 251.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 250.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 222.67 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 213.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 250.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 248.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 221.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 211.65 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 244.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 176.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 242.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 174.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.66 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 231.94 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 223.31 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 166.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 151.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.31 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 241.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 174.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 158.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 240.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 172.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.40 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 229.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 221.05 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 164.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.18 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 240.38 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 172.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.26 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 238.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 170.87 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.96 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 228.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 219.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 163.10 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 148.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.67 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.67 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.22 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 163.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 148.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 173.54 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 161.51 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 173.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 172.10 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 160.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.61 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 145.32 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.38 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 223.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 221.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 202.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 186.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 221.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 219.17 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 200.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 184.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 220.03 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 217.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 199.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 183.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 213.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 211.49 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 210.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 194.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 152.37 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 138.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 211.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.37 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 209.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 208.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.61 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.43 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 210.22 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.94 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 207.92 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.38 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 206.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 191.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 148.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.18 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 135.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.44 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 137.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.10 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.49 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 147.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 135.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.96 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.74 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.18 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.06 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 145.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 134.40 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 149.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 136.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 149.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 136.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 156.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 163.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 157.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 158.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 151.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 155.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 183.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 181.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 163.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 145.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 175.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 157.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 139.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 174.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 172.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 154.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 173.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 171.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.15 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 170.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 156.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 153.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 132.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 167.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 166.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 168.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 165.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 151.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 147.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 164.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 161.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 144.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.15 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 185.15 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 177.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 129.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 180.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 104.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 112.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 97.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 112.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 100.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 123.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 108.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 142.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 135.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 128.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 120.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 122.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 114.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 140.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 162.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 138.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 124.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 133.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 117.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 142.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 131.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 168.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 146.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 159.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 140.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 131.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 134.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 125.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 140.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 130.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 142.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 124.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 142.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 124.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 163.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 145.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 147.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 138.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 145.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 136.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 134.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 164.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 145.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 128.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 159.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 143.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 126.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 158.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 142.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 124.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 154.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 157.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 152.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 138.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 119.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 104.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 149.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 155.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 150.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 135.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 134.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 117.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 102.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 150.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 148.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 149.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 134.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 133.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 116.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 93.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 118.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 166.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 118.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 103.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 157.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 116.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 101.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 108.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 163.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 155.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.15 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 107.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 93.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 139.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 141.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 171.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 165.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 163.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 156.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 158.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 151.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 182.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 173.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 153.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 139.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 141.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 198.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 170.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 188.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 197.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 188.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 190.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 193.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 170.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 150.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 181.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 185.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 162.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 167.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 158.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 174.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 160.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 129.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 125.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 165.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 152.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 122.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 163.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 156.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 120.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 111.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 154.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 148.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 218.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 191.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 198.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 208.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 174.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 216.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 176.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 207.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 173.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 206.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 201.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 181.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 180.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 173.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 162.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 174.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 197.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 207.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 172.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 192.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 170.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 172.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 183.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 190.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 167.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 158.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 153.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 187.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 169.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 161.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 144.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 144.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 139.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 177.58 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 173.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 160.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 178.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 164.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 146.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 162.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 150.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 168.58 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 175.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 165.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 153.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 131.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 136.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 122.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 165.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 156.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 270.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 202.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 242.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 259.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 192.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 266.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 199.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 226.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 257.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 190.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 237.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 251.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 201.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 184.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 198.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 213.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 226.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 247.58 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 191.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 228.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 189.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 195.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 217.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 225.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 185.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 180.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 215.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 212.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 210.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 188.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 170.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 163.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 166.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 201.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 203.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 178.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 207.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 183.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 173.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 196.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 172.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 204.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 158.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 194.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 170.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 198.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 189.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 182.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 150.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 144.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 187.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 172.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 175.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.68 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 196.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 179.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 178.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 173.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 170.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 175.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 203.31 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 202.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 180.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 201.18 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 200.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 178.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 161.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 199.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 198.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 177.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 159.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 189.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 189.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 187.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 173.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 171.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 187.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 187.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 185.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 171.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 169.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 187.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 185.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 185.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 183.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 167.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 204.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 196.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.68 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.18 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 202.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 193.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 201.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 192.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 122.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 128.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 114.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 128.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 115.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 138.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 125.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 139.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 133.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 133.68 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 128.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 131.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 125.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 150.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 134.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 133.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 129.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 143.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 142.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 126.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 141.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 146.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 132.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 147.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 141.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 140.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 127.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 138.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 138.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 185.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 167.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 162.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 172.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 154.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 170.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 189.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 186.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 168.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 150.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 180.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 178.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 178.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 162.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 178.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 175.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 176.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.21 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 176.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.68 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 174.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 118.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 175.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 175.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 159.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 194.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 185.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 192.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 182.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 191.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 181.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 173.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 173.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 184.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 176.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 180.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 173.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 178.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 170.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 195.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 180.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 191.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 175.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 189.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 173.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 127.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 163.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 165.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 153.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 131.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 116.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 152.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 142.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 118.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 156.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 123.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 107.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 144.18 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 138.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 114.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 153.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 147.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 119.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 103.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 140.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 177.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 162.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 178.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 163.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 141.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 163.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 176.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 161.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 167.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 144.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 150.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 127.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 163.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 166.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 141.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 152.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 130.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 165.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 157.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 155.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 133.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 138.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 116.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 152.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 145.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 161.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 147.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 125.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 161.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 154.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 151.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 128.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 21-Aug-2025 12:37 133.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 111.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 148.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 143.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 199.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 175.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 183.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 165.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 195.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 175.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 197.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 180.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 177.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 160.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 162.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 146.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 183.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 164.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 185.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 173.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 171.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 159.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 182.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 147.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 158.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 184.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 167.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 172.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 150.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 133.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 169.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 159.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 179.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 156.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 164.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 176.18 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 141.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 163.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 178.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 161.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 168.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 144.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 127.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 164.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 155.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 183.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 168.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 183.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 168.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 204.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 188.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 186.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 181.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 184.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 179.64 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 183.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 178.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 197.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 181.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 131.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 116.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 195.49 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 179.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 129.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 194.25 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 178.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.44 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 118.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 213.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 204.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 211.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 202.43 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.35 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 210.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 200.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 136.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 122.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 136.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 123.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 146.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 133.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 147.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 141.39 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 141.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 136.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 139.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 133.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.49 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 158.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 142.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 154.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 137.06 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 131.69 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 150.43 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 134.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 129.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 138.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 139.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 161.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 154.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 151.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 155.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 149.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 130.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 146.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 143.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 127.78 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.24 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 153.49 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 153.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 190.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 173.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 172.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 167.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 170.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 164.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 163.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 183.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 167.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.96 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 181.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 164.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 113.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 180.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 163.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 199.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 189.69 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 113.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.65 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 197.14 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 187.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 195.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 186.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 195.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 179.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 177.36 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 173.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 175.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 170.83 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 205.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 204.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 179.25 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 203.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 202.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 177.22 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 201.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 200.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 175.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 159.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 191.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 188.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 187.04 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.97 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 171.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 127.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.90 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 189.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.90 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 186.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 184.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 170.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 169.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.79 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 187.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 184.90 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 183.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 167.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 204.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 195.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 202.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 193.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 122.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.15 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 200.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 192.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 127.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 113.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 127.79 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 114.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 137.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 124.50 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 138.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 132.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 132.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 127.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 130.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 124.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 149.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 133.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 147.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 133.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 118.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.97 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 128.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 142.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.97 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 141.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 125.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 139.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 152.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 145.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 144.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 132.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 146.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 140.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 139.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.24 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 137.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 163.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 185.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 168.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 167.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 164.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 194.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 170.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 154.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 168.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 151.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 166.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 150.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 182.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.53 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 179.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.53 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 178.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 178.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 179.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 176.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 122.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 178.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 176.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 174.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 175.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 158.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.53 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 193.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 184.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.97 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 191.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 182.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.41 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 190.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 180.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 108.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 177.15 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 198.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 181.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 180.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 175.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 178.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 171.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 205.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 204.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 181.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 164.94 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 203.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 202.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 179.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 162.68 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 201.68 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 200.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 177.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 161.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.83 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 191.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 190.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 187.33 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 175.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 173.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 189.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 188.85 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 185.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 170.92 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 188.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.90 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 187.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 187.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 183.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 171.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 169.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.83 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.58 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 206.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 197.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 125.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.58 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.37 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 204.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 195.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.69 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.69 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 203.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 194.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 122.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.15 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 130.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 116.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 130.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 117.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 140.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 127.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 141.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 135.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 135.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 130.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 133.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 127.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 151.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 152.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 136.47 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 133.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.04 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.08 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 146.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 130.78 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 143.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.97 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 140.21 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 128.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 141.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 126.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.35 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 132.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 147.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 131.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 130.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 149.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 143.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 140.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 127.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 144.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 146.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 140.47 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 138.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 149.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 149.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 186.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 169.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 168.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 163.04 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 166.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.92 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 194.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 171.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 154.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 192.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 169.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 152.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 190.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 189.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 168.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 151.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 182.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 179.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.37 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 179.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 179.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 163.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.94 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 114.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 99.22 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 179.94 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 177.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 177.33 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 160.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 178.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.94 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 176.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 176.33 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 175.96 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 159.51 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.22 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 195.21 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 185.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 193.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 183.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 106.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 121.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 191.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 182.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.85 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 139.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 153.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 139.93 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 173.61 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.78 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 166.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 162.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 155.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 158.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 152.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 186.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 185.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 165.58 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 148.87 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 181.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 179.85 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 159.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 143.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 176.67 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 156.29 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 140.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 177.13 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.93 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.97 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 175.93 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.03 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.29 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 177.71 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 172.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 160.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 156.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 132.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.81 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 121.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.71 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 171.23 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.07 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 170.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.26 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 172.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 167.48 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 155.18 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 151.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 128.16 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 108.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.48 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 168.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.00 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.89 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 166.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.10 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.21 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 169.08 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 163.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 152.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 148.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 123.80 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.89 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.66 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 133.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 122.72 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 189.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 181.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 129.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.57 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 119.83 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 105.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 127.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.82 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 184.68 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 175.77 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 124.92 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 107.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 98.69 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 126.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.45 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 124.32 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 181.37 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 172.70 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 120.79 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 104.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 111.37 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.48 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 115.52 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 100.24 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 115.42 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 102.92 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 125.69 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 111.05 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 145.43 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 138.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 131.42 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 123.47 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 125.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 117.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 168.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 166.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 155.52 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 156.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 143.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 162.43 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 150.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 150.66 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.14 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 154.93 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.57 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 152.14 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.31 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 141.29 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 126.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.98 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 134.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.54 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 125.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 148.48 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 136.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 145.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.24 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 135.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 120.46 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 142.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 128.17 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 130.94 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.38 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 169.85 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 157.38 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 167.22 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.23 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 157.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 149.28 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 159.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 141.79 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 149.10 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 132.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 156.15 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 143.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 153.36 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 142.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 142.89 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 134.41 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 146.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 129.39 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 136.50 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 120.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 149.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 137.09 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 146.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 135.96 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 137.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 128.38 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 140.33 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 123.29 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 130.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.16 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 143.37 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 127.55 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 143.24 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 127.14 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.11 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 148.27 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 147.64 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 141.16 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 145.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 139.04 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 144.25 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 137.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 167.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 165.41 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 147.56 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 130.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 165.59 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 163.28 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 145.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 128.65 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 164.16 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 161.72 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 144.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 127.21 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 157.80 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.89 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 155.60 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 118.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.46 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 157.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 154.84 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 140.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 138.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 119.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 104.36 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 112.41 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 97.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 155.66 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.94 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.63 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 153.47 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.25 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 155.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 152.68 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 138.62 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 136.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 117.70 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 102.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 95.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 154.22 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.50 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 151.91 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.82 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 154.51 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 21-Aug-2025 12:37 151.44 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 137.17 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 21-Aug-2025 12:37 135.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 116.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.66 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 109.12 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 93.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.99 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 113.33 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 119.30 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 114.31 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 168.97 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 161.85 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 118.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 103.66 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 110.63 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 96.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 111.19 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 117.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 112.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 166.93 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 159.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 116.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 101.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 108.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 94.34 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 116.29 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 109.62 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 115.61 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 110.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 21-Aug-2025 12:37 165.69 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 21-Aug-2025 12:37 158.29 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 115.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 100.09 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 21-Aug-2025 12:37 107.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 21-Aug-2025 12:37 92.91 KB
LICENSE 21-Aug-2025 12:37 11.09 KB
Artifactory/7.55.14 Server at edge.urm.nvidia.com Port 80