Index of sw-kernelinferencelibrary-public-generic-local/991e7438224199de85ef08a2730ce18c12b4e0aa/fmha/trtllm-gen
Name Last modified Size
../
flashInferMetaInfo.h 25-Jul-2025 11:13 700.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 396.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 392.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 279.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 264.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 395.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 390.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 277.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 262.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 394.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 389.63 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 276.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 261.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 305.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 195.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 185.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 300.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 195.74 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 186.13 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 301.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 283.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 198.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 189.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 303.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 184.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 299.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.25 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 184.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 299.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 281.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 197.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 187.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.31 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 302.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 193.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 183.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 297.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 193.13 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 183.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 298.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 280.46 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 196.06 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.71 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 186.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.15 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 200.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 189.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 200.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 190.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 203.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 182.22 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 193.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 198.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 188.50 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 198.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 189.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 201.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 191.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 197.67 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 187.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 197.51 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 187.90 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 200.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 179.58 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 190.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.86 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 353.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 350.86 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 238.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 351.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 348.85 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 236.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 219.65 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 349.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 347.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 235.25 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 218.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 261.18 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.78 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 259.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 259.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 241.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 172.32 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 165.11 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 259.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 257.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.81 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 257.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 239.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 170.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 258.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.63 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 255.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 257.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 238.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 169.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 162.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 166.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.33 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 176.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 169.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.65 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.14 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.56 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 174.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 167.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.64 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.75 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 163.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.81 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.71 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 166.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 252.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 236.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 249.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 233.14 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 248.27 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 231.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 259.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 179.78 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 254.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.09 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 262.77 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 259.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 233.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 235.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 167.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.48 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 256.54 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 166.74 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 251.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 259.62 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 256.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 230.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 232.84 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 164.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 157.00 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 254.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.01 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 249.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.93 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 258.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 255.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 228.99 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 230.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 162.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.60 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 185.10 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 174.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 185.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.64 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 299.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 282.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 171.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.74 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.05 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 182.34 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 182.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 172.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 296.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 279.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 167.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.67 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.87 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 294.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 277.90 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 166.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 229.96 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 222.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 228.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 220.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 237.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 136.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 234.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.13 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 239.82 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 240.96 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 221.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 214.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 150.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 142.69 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.53 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 235.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 232.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 238.42 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 239.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 219.78 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 212.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.89 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.29 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.04 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.47 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.92 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 275.90 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 268.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 154.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 146.35 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.68 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 274.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 266.69 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 144.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 380.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 375.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 259.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 246.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 379.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 374.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 257.74 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 245.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 378.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 372.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 256.87 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 244.31 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 288.39 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.13 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 283.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 172.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 163.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 281.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 264.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 174.89 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 165.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 286.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 281.49 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 279.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 263.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.22 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 285.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.53 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 280.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.21 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 278.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 262.14 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 172.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.43 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 162.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 168.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 176.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.83 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 177.08 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 166.99 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.68 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.58 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 174.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 176.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 166.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 348.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 345.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 229.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 216.50 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 346.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 343.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 227.99 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 214.61 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 344.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 342.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 227.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 213.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 255.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 253.25 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.50 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 251.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 234.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 151.66 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 253.83 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.08 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 251.37 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 249.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 232.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 149.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.72 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 252.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.67 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 250.23 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 248.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 231.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 157.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.82 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.24 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 164.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.32 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.44 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 162.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.03 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.05 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.85 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 161.74 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.54 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 210.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 190.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 209.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 195.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 255.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 234.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 231.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 203.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 228.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 200.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 226.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 198.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 331.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 329.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 216.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 196.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 329.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 326.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 213.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 193.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 326.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 324.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 211.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 191.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 237.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 235.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 241.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 238.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 208.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 215.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 235.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 232.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 238.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 235.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 205.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 212.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 146.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 232.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 230.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 236.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 232.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 203.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 210.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 276.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 248.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 273.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 245.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 150.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 138.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 271.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 243.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 145.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 128.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 145.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 137.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 168.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 151.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 172.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 148.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 162.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 142.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 157.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 138.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 182.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 157.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 188.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 172.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 150.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 178.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 169.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 168.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 146.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 164.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 166.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 195.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 170.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 192.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 183.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 184.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 165.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 182.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 180.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 161.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 177.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 168.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 197.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 179.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 196.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 186.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 241.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 223.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 213.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 191.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 211.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 189.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 210.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 315.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 314.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 200.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 182.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 313.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 312.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 198.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 180.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 312.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 311.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 197.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 179.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 220.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 223.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 222.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 202.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 139.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 219.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 218.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 221.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 220.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 197.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 200.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 218.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 217.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 220.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 219.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 196.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 199.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 257.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 235.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 133.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 255.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 233.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 254.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 232.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 140.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 130.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 213.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 194.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 204.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 253.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 214.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 247.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 208.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 244.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 205.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 262.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 224.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 257.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 219.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 253.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 215.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 213.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 194.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 204.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 151.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 192.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 182.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 163.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 196.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 176.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 186.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 214.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 176.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 190.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 169.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 141.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 204.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 181.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 139.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 183.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 197.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 183.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 151.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 128.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 186.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 175.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 131.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 172.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 166.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 190.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 145.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 121.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 180.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 171.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 210.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 187.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 194.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 181.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 199.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 211.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 188.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 179.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 172.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 202.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 239.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 192.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 214.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 178.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 185.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 162.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 155.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 228.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 183.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 204.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 182.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 166.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 184.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 196.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 179.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 168.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 157.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 187.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 219.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 177.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 206.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 166.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 165.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 150.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 140.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 208.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 197.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 186.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 174.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 176.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 157.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 187.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 175.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 162.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 148.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 212.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 202.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 160.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 157.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 144.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 131.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 201.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 192.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 238.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 207.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 213.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 224.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 235.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 205.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 195.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 224.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 278.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 218.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 234.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 188.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 217.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 180.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 268.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 208.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 222.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 218.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 197.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 193.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 204.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 185.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 215.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 195.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 175.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 204.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 184.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 250.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 198.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 224.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 189.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 160.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 239.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 188.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 213.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 208.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 192.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 183.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 205.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 190.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 165.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 194.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 179.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 240.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 189.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 219.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 179.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 150.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 230.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 207.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 317.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 203.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 183.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 317.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 315.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 201.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 181.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 316.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 314.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 200.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 180.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 233.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 201.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 219.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 231.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 199.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 220.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 218.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 230.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 198.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 122.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 138.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 108.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 136.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 145.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 159.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 149.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.21 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 136.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 157.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 147.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 301.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 299.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 192.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 174.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 299.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 297.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 191.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 172.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 297.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 295.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 190.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 171.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 211.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 209.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 223.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 192.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 209.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 207.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 221.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 190.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 121.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 208.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 206.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 220.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 189.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 128.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 120.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 95.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 108.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 133.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 124.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 128.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 175.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 168.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 145.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 117.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 166.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 123.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 170.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 165.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 140.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 112.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 161.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 157.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 119.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 167.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 137.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 109.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 159.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 172.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 156.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 170.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 158.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 146.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 187.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 157.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 157.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 141.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 129.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 178.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 170.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 166.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 147.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 162.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 151.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 138.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 182.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 175.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 150.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 151.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 134.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 120.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 172.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 167.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 163.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 144.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 134.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 147.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 148.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 25-Jul-2025 11:13 131.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 117.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 169.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 165.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 193.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 176.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 179.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 181.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 191.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 174.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 161.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 181.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 165.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 213.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 174.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 201.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 178.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 146.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 201.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 190.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 184.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 171.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 171.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 173.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 182.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 153.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 172.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 206.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 166.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 197.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 171.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 138.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 194.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 185.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 180.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 166.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 158.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 178.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 167.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 157.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 202.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 161.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 195.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 167.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 133.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 190.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 183.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 215.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 197.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 214.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 194.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 261.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 243.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 228.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 208.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 226.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 207.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 225.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 205.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 238.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 231.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 206.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 200.65 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 236.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 229.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 204.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 198.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 235.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 228.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 203.71 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 197.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 124.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.43 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 274.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 255.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 273.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 253.86 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 140.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.44 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 272.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 252.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 139.03 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 128.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 153.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 138.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 152.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 138.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 174.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 162.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 169.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 153.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 165.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 149.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 163.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 147.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 179.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 153.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.60 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 151.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 144.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.65 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 176.14 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 149.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.22 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.24 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.78 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 174.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 147.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 146.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 153.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.96 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 190.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 176.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 168.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 136.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 186.96 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 173.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 164.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 148.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 185.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 171.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 162.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 150.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 201.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 183.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 200.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 181.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 248.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 229.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 212.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 195.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 210.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 193.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 209.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 192.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 222.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 220.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 192.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 191.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.64 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.71 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 220.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 218.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 190.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 189.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 130.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 219.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 217.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 189.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 188.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 122.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.25 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 259.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 242.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 257.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 240.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.14 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 256.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 239.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 207.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 189.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 207.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 187.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 254.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 236.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 221.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 201.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 219.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 198.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 321.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 201.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 183.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 318.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 199.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 181.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 318.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 316.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 198.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 180.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 225.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 231.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 231.83 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 201.15 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 229.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 229.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 197.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 199.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 222.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.25 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 220.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 228.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 228.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 196.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 198.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 130.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 122.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 267.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 248.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 266.04 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 246.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 265.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 245.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.41 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 145.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 130.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 145.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 130.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 166.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 154.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 161.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 145.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 158.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 142.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 156.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 139.81 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 171.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 145.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 156.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.36 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 168.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 141.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 144.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.50 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 166.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 139.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 151.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 182.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 168.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 161.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.93 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 179.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 165.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 157.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 177.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 163.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 156.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 147.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 197.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 179.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 196.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 177.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 243.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 225.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 208.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 191.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 206.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 189.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 205.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 187.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 302.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 300.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 190.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 173.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 300.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 298.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 188.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 171.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 299.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 297.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 187.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 170.41 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 213.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 211.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 220.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 191.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 211.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 209.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 216.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 218.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 187.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 189.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 121.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 210.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 207.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 215.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 218.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 185.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 188.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 128.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 120.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 95.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 254.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 237.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 253.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 235.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 133.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 252.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 234.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 124.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 204.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 230.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 204.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 228.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 201.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 226.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 200.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 240.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 203.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 237.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 201.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 236.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 204.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 188.08 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 321.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 320.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 202.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 184.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 318.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 200.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 182.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 318.51 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 316.92 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 199.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 181.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 225.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 232.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 202.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.67 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.69 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 221.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.86 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 230.89 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 200.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 222.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 220.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 230.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 198.89 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.46 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 122.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 138.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 108.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 130.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 143.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.35 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 155.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 145.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 141.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 163.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 152.53 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 149.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 135.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 160.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 149.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 147.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 133.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 145.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 158.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 147.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 302.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 300.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 191.67 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 174.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 300.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 298.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 189.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 172.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 299.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 297.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 188.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 171.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 213.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 211.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 221.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 192.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 123.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 211.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 111.85 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 209.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 219.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 190.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 129.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 121.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 96.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 210.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 208.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 219.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 189.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 128.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 102.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 120.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 95.21 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 135.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 108.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 133.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 125.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.97 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 132.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 124.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 216.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 196.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 215.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 200.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 260.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 240.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 237.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 209.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 234.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 206.45 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 232.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 204.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 339.68 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 337.94 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 219.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 202.53 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 336.79 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 335.17 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 216.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 199.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 334.66 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 332.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 214.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 197.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 244.94 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.83 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 243.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 247.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 240.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 214.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 219.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 242.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 240.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 244.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 238.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 211.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 216.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 146.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 134.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 103.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 239.78 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.92 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 238.16 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.61 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 242.17 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 235.82 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 209.01 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 214.48 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 110.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.78 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 139.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 282.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 253.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 153.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.57 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 109.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 136.76 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.75 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 279.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 251.18 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 150.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 115.79 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 138.53 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.70 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.85 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.03 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.49 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 277.01 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 249.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 148.23 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 113.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.44 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 149.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 132.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 149.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 141.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 172.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 155.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 176.39 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 151.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 166.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 146.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 161.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 142.74 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 164.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.58 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 163.65 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 154.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 186.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 161.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 188.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.73 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 179.53 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 137.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.31 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.41 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.41 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 176.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 154.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 178.43 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.47 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 169.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.25 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 152.04 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 151.13 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 171.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 150.13 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 134.46 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 164.82 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.98 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 169.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 168.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 198.97 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 174.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 192.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 183.27 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 140.53 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 160.82 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.84 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 159.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 150.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 188.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 168.99 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 182.57 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 142.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 173.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 132.80 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 156.54 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.56 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 155.63 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 146.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 184.25 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 165.47 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 178.05 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 138.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 168.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 201.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 183.98 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 201.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 191.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 246.33 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 228.35 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 217.99 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 196.08 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 216.12 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 194.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 215.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 193.06 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 322.96 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 320.96 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 204.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 188.62 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 320.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 202.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 186.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 319.81 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 317.94 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 201.24 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 185.59 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 228.09 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.89 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 226.21 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 126.36 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 227.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 225.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 203.70 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 205.72 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 139.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 128.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 100.50 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 226.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 114.01 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 224.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.85 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.87 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 225.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 223.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 201.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 203.71 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 137.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 105.86 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 127.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.61 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 225.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 119.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 112.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 223.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 123.72 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 116.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 225.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 25-Jul-2025 11:13 222.84 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 200.70 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 25-Jul-2025 11:13 202.58 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 136.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 104.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 126.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 97.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 127.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 120.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 131.28 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.16 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 262.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 240.40 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 143.63 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 108.93 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 133.17 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 101.43 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 125.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 118.37 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 129.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 122.65 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 260.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 238.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 141.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 107.55 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 131.27 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 99.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 124.25 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 117.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 128.64 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 121.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 259.30 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 237.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 140.87 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 106.41 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 25-Jul-2025 11:13 130.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 25-Jul-2025 11:13 98.79 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.85 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.86 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 210.84 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 258.70 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 220.24 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 253.06 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 214.62 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 249.77 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 211.22 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 268.41 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 230.89 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 262.88 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 225.26 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 259.59 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 222.00 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 199.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 25-Jul-2025 11:13 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 25-Jul-2025 11:13 210.96 KB
LICENSE 25-Jul-2025 11:13 11.09 KB
Artifactory/7.55.14 Server at edge.urm.nvidia.com Port 80