Index of sw-kernelinferencelibrary-public-generic-local/d25901733420c7cddc1adf799b0d4639ed1e162f/fmha/trtllm-gen
Name Last modified Size
../
flashInferMetaInfo.h 17-Jul-2025 10:59 700.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 397.54 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 393.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 280.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 264.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 395.75 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 391.18 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 277.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 262.96 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 394.35 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 389.90 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 276.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 261.69 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 305.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 196.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 186.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 301.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 196.56 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 186.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 301.82 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 283.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 199.76 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 181.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 190.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.61 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 304.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 194.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 184.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.45 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 194.67 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 185.06 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 299.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 282.00 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 197.35 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 179.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 188.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 170.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 302.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 193.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 183.15 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 298.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 193.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 183.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 298.50 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 280.73 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 196.33 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 177.85 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 186.86 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 169.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 201.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 190.68 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 200.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 191.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 203.81 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 183.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 194.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 174.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 199.21 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 188.92 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 199.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 189.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 201.53 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 181.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 191.70 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 172.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 197.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 187.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 197.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 188.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 200.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 179.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 190.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 171.00 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 353.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 351.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 238.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 222.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 351.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 349.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 236.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 220.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 350.15 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 347.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 235.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 218.78 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 261.74 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 259.58 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 162.14 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 260.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 242.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 173.14 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 165.92 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 138.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 259.58 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.18 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 257.54 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 153.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 258.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 240.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 170.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 143.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 163.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 136.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 258.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 256.14 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.83 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 152.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 257.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 239.11 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 169.82 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 162.47 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 163.21 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 167.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 177.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.57 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 169.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.22 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 154.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 165.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.35 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 175.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 146.53 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 167.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 153.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 163.57 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 173.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 166.51 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.77 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 253.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 236.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 250.07 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 233.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 248.53 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 231.39 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 260.37 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 170.32 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 255.00 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 171.65 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 263.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 260.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 234.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 236.67 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 168.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 160.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.17 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 256.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 177.43 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 167.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 251.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 177.61 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 168.35 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 260.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 257.21 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 231.29 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 233.25 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 164.63 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.00 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 157.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 254.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 175.27 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 164.87 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 249.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 175.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 258.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 255.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 229.13 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 231.09 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 162.97 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.72 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 155.75 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 185.92 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 175.39 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 186.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 176.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 300.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 283.60 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 171.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 164.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 152.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 182.75 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.21 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 182.93 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 173.29 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 296.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 280.32 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 168.36 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 157.08 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 160.85 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.47 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 169.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.65 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 171.13 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 295.21 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 278.17 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 166.71 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 159.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.42 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 230.37 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 222.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 228.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 220.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 237.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 142.60 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 136.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 234.61 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 140.54 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 240.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 241.37 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 222.08 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 214.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 150.82 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 143.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 235.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.32 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 134.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 232.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.43 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 238.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 239.72 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 219.92 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 212.29 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 141.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 118.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.10 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 140.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 151.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.34 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 276.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 269.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 154.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.64 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 146.89 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 138.17 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.60 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 143.05 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 274.77 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 266.96 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 153.24 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.36 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 145.09 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.24 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 381.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 376.29 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 260.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 247.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 379.89 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 374.50 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 258.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 245.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 378.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 373.10 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 257.01 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 244.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 289.21 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 173.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 163.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 283.82 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 173.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 163.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 282.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 265.60 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 175.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 165.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 287.29 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 172.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 161.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 281.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 171.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 162.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 279.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 263.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 173.43 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 163.51 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 285.89 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 170.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 280.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 170.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 160.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 278.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 262.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 172.28 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 153.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 162.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.21 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 178.58 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 168.01 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 178.01 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 179.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 169.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 150.01 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 176.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 176.25 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 177.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 167.40 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 175.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 164.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 174.85 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 165.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 176.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.79 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 166.26 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 146.82 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 348.56 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 346.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 230.66 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 217.06 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 346.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 344.18 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 228.40 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 215.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 345.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 342.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 227.23 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 213.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 256.28 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.28 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 253.82 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 151.17 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 144.44 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 252.51 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 235.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 161.17 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.15 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 152.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 254.23 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.21 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 251.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.25 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 250.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 233.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 158.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 150.04 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 124.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 252.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 250.38 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 249.08 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 231.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 157.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 152.51 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 145.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 165.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 136.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 156.13 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.39 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 163.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 134.44 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 153.83 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 126.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.31 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.99 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 145.87 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 161.89 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.04 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 152.68 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 210.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 190.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 209.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 195.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 255.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 234.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 232.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 204.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 229.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 201.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 226.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 198.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 332.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 330.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 217.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 197.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 329.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 327.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 213.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 194.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 327.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 324.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 211.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 191.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 238.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 236.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 124.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 242.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 238.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 208.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 216.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 138.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 235.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 232.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 238.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 235.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 205.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 213.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 146.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 103.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 233.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 230.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 236.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 233.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 203.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 210.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 143.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 132.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 101.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 277.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 248.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 154.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 142.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 273.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 245.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 150.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 138.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 271.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 243.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 148.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 145.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 128.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 145.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 137.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 168.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 151.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 174.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 149.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 162.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 143.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 158.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 139.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 165.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 184.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 162.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 190.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 181.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 155.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 146.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 173.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 151.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 178.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 169.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 150.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 168.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 146.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 174.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 165.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 170.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 160.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 169.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 196.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 172.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 194.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 152.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 184.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 143.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 150.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 159.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 185.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 166.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 183.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 143.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 173.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 180.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 162.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 178.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 138.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 168.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 197.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 179.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 196.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 186.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 241.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 223.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 214.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 191.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 211.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 189.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 210.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 316.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 315.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 201.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 182.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 314.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 313.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 199.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 180.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 312.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 311.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 198.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 179.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 222.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 221.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 223.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 223.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 200.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 202.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 140.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 108.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 129.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 220.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 219.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 221.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 221.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 198.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 200.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 137.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 106.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 127.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 99.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 218.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 118.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 111.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 217.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 220.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 219.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 196.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 199.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 136.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 126.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 97.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 258.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 236.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 144.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 109.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 102.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 124.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 255.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 234.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 142.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 107.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 254.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 232.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 141.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 130.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 213.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 194.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 204.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 254.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 215.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 247.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 209.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 244.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 205.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 263.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 225.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 257.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 219.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 254.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 216.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 213.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 194.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 204.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 155.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 197.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 173.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 186.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 163.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 200.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 176.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 190.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 167.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 216.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 180.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 190.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 157.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 171.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 145.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 206.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 182.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 139.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 170.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 183.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 169.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 173.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 197.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 164.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 183.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 152.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 128.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 187.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 175.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 132.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 173.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 162.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 162.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 176.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 165.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 190.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 180.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 145.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 145.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 121.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 180.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 171.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 138.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 215.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 187.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 194.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 187.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 204.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 177.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 216.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 189.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 179.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 177.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 207.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 180.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 242.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 197.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 215.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 169.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 178.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 187.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 162.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 160.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 231.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 187.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 205.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 195.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 178.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 182.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 167.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 184.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 196.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 180.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 168.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 157.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 187.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 220.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 177.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 207.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 167.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 166.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 151.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 140.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 209.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 197.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 153.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 186.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 174.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 176.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 158.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 175.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 164.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 188.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 175.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 161.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 148.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 179.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 167.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 212.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 168.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 202.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 160.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 158.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 144.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 131.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 201.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 159.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 192.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 247.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 210.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 221.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 233.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 197.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 244.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 207.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 204.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 232.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 196.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 281.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 227.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 236.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 190.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 220.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 188.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 271.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 217.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 224.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 181.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 220.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 199.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 195.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 207.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 186.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 218.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 196.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 178.04 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 206.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 186.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 252.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 201.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 225.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 179.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 191.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 162.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 241.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 190.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 214.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 170.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 209.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 193.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 184.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 196.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 207.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 190.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 167.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 195.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 179.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 241.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 190.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 219.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 173.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 180.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 151.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 230.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 180.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 208.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 164.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 320.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 318.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 204.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 184.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 318.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 315.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 201.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 181.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 316.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 314.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 200.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 180.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 224.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 221.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 234.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 201.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 135.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 108.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 126.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 100.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 221.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 219.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 232.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 199.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 132.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 98.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 220.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 218.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 231.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 198.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 104.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 123.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 96.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.57 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 139.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 111.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 130.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 103.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.31 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 137.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 109.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 136.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 127.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 159.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 149.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 155.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 145.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 128.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 153.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 143.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 151.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 164.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 153.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 135.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 138.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 160.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 149.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 136.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 158.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 147.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 301.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 193.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 174.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 299.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 297.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 191.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 172.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 298.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 296.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 190.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 171.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 212.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 210.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 223.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 192.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 132.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 99.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 210.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 111.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 208.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 221.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 190.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 129.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 103.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 122.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 96.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 208.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 109.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 206.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 220.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 189.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 102.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 121.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 95.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 136.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 108.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 128.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 134.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 126.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 133.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 125.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 98.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 128.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 142.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 176.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 168.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 146.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 117.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 168.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 161.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.21 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 122.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 142.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 137.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 153.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 144.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 171.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 135.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 165.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 140.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 112.21 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 162.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 157.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 119.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.31 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 144.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 150.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 146.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 137.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 168.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 164.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 137.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 109.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 159.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 156.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.31 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 172.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 154.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 168.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 158.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 144.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 160.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 151.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 189.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 180.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 157.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 158.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 141.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 127.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 180.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 171.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 161.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 154.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 166.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 147.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 162.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 155.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 152.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 138.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 153.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 183.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 144.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 176.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 151.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 152.33 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 135.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 120.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 173.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 167.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 152.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 163.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 144.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 144.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 158.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 153.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 149.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 134.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 150.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 145.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 179.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 174.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 17-Jul-2025 10:59 147.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 148.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 17-Jul-2025 10:58 132.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 117.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 170.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 131.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 165.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 192.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 176.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 179.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 180.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 165.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 190.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 174.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 161.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 165.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 215.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 174.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 203.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 180.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 145.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 203.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 163.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 191.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 184.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 172.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 171.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 173.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 160.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 182.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 169.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 153.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 160.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 208.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 198.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 153.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 172.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 138.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 196.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 186.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 180.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 169.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 167.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 178.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 167.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 149.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 168.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 158.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 203.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 195.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 151.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 168.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 133.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 191.18 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 151.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 183.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 215.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 197.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 214.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 194.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 261.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 243.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 229.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 209.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 226.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 207.49 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 225.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 206.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.24 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 238.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 232.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 207.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 201.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 138.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 128.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 101.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 236.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 229.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 205.25 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 199.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 135.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 108.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 125.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.35 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 235.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 228.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 203.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 197.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.96 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.69 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 98.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 135.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 275.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 256.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 142.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 132.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.83 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.22 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 273.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 254.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 140.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 111.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 129.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 131.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 272.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 252.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 139.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 110.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 100.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 153.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 138.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 152.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 138.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 174.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 162.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 170.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 155.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 166.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 150.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 164.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 147.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 140.65 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 180.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 154.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 164.83 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 152.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 136.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 176.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 150.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 160.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 148.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 142.94 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.60 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 174.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 147.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 158.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 146.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 155.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 154.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 191.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 178.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 169.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 156.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 150.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.78 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 187.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 174.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 165.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 152.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 148.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 138.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 185.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 171.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 163.22 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 150.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 201.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 183.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 200.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 181.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 248.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 229.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 213.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 195.71 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 211.22 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 193.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 210.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 192.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.69 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 223.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 221.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 193.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 191.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 133.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.03 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 126.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.08 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 221.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 219.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 191.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 189.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 131.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 123.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 97.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.27 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 219.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 217.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 190.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 188.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 130.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 103.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 122.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 96.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.82 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 260.14 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 242.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 137.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 130.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 102.72 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 124.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.64 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 257.86 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 240.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 135.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.04 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 100.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 256.83 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 239.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 106.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 126.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 207.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 189.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 207.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 187.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 254.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 236.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 221.96 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 202.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 219.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 200.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 218.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 199.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 322.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 320.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 202.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 183.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 320.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 318.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 200.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 181.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 318.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 317.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 198.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 180.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 226.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 224.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 128.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 231.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 232.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 200.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 201.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 133.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 126.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 224.11 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 126.79 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 222.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 229.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 230.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 198.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 199.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 123.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 97.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 222.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 112.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 221.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 228.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 229.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 196.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 198.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 130.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 103.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 122.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 96.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 134.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.25 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 268.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 249.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 138.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 130.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 102.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 131.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 266.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 247.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 135.83 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 265.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 245.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 106.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 127.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 145.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 130.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 145.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 130.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 166.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 154.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 162.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 147.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 158.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 142.90 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 156.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 140.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 136.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.36 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 172.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 147.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 158.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.93 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 168.81 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 142.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 154.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 145.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 166.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 140.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 151.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 143.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 111.93 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 154.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 141.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.93 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.28 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 183.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 170.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 162.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 153.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 136.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.50 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 179.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 166.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 158.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 124.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 133.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 145.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 177.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 163.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 156.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 147.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 197.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 179.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 196.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 177.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 243.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 225.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 209.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 191.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 206.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 189.53 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 205.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.15 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 303.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 301.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 191.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 174.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 301.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 189.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 171.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 297.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 188.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 170.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 213.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 211.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 218.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 221.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 189.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 192.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 131.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 98.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 211.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 112.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 209.53 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 216.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 219.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 187.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 189.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 129.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 103.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 121.81 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 96.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 210.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 110.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 208.26 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 215.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 218.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 186.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 188.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 102.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 120.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 95.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 118.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 255.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 238.22 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 108.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 128.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 123.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 253.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 236.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 133.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 106.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 125.79 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.25 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.78 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 252.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 234.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 132.83 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 97.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 204.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 231.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 205.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 228.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 202.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 226.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 200.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 241.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 204.72 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 238.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 201.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 236.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 199.78 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 204.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 188.08 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 322.22 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 320.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 203.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 184.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 320.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 318.46 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 201.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 182.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 318.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 317.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 199.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 181.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 226.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 224.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 128.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 233.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 202.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 135.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 108.33 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 126.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 100.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 224.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.90 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 222.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 126.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 231.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 200.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 132.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.28 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 124.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 98.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 222.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 221.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 230.15 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 199.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 104.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 122.97 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 96.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 119.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 139.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 111.35 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 130.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 102.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 131.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 137.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 109.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 128.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 100.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 107.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 127.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 136.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 159.86 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.78 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.04 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 155.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.67 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 145.82 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.95 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 141.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.47 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 140.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 153.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 143.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 154.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 153.04 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 144.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 164.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.15 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 153.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 149.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 136.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 148.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.96 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 160.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 149.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 147.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 146.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 137.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 158.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 147.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 303.33 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 301.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 192.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 175.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 301.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 190.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 172.90 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 299.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 297.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 189.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 171.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 213.83 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 211.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.15 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 222.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 192.96 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 105.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 124.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 98.92 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 211.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 118.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 112.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 209.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.59 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 220.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 190.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 129.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 103.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 122.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 96.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 210.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 208.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.58 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 114.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 219.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 189.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 102.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 120.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 95.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.68 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.20 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 122.68 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 108.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 128.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.51 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 134.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 126.07 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 115.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 125.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 132.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 105.27 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 125.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 98.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 216.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 196.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 215.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 200.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 260.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 240.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 238.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 209.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 234.80 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 206.73 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 232.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 204.47 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 340.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 338.63 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 220.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 203.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 337.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 335.46 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 216.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 199.92 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 334.92 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 333.18 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 214.37 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 197.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 245.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 135.56 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 243.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.33 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.46 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 248.03 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 241.68 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 214.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 220.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 149.80 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 115.80 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 137.77 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 107.10 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 242.33 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 240.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 132.03 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 122.16 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 244.47 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 238.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 211.43 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 216.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 146.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 112.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 134.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 103.80 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 240.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 129.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 117.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 238.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 129.75 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.89 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 242.44 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 235.96 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 209.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 214.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 143.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.35 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 132.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.66 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.70 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 126.75 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 130.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 282.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 254.63 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 154.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 119.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 142.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 110.28 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 137.40 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.58 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 137.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 279.43 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 251.46 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 150.67 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 138.69 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 135.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 134.77 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.76 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 277.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 249.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 148.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 113.81 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 149.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 132.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 149.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 141.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 172.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 155.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 177.82 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 153.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 166.53 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 147.59 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 161.84 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 143.40 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 167.70 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.74 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 166.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 188.03 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 165.81 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 190.17 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 149.98 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 181.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 140.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 157.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.28 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.35 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 147.48 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 176.86 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 155.10 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 179.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 139.57 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 169.79 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.21 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.58 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 142.59 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 151.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.66 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 172.17 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 150.66 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 174.20 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 134.89 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 165.10 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.52 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 172.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 161.87 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 171.27 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 161.88 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 200.49 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 176.50 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 194.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 152.98 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 184.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 142.88 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 161.76 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 151.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 160.85 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 151.73 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 189.22 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 170.31 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 183.15 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 143.88 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 173.65 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 133.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 156.95 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.97 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 156.17 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 146.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 184.54 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 166.13 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 178.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 139.05 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 168.96 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 128.81 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 201.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 183.98 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 201.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 191.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 246.33 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 228.35 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 218.80 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 196.64 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 216.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 194.60 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 215.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 193.22 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 323.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 321.65 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 204.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 189.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 321.36 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 319.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 202.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 187.14 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 320.09 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 318.08 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 201.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 185.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 228.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.45 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 116.59 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 226.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 127.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 120.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 228.64 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 226.55 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 204.27 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 206.29 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 140.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 108.44 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 129.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 101.19 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 226.61 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 121.29 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 114.42 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 224.61 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.26 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 118.28 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 226.34 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:58 224.24 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 202.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 204.12 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 137.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 106.27 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 127.46 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 99.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 225.21 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.01 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 113.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:59 223.34 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.86 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 116.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 225.31 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 17-Jul-2025 10:59 223.11 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 200.84 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 17-Jul-2025 10:58 202.84 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 136.76 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 104.87 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 126.32 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 97.62 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 127.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 120.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 132.10 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.98 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 262.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 240.96 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 144.45 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 109.75 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 133.99 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 102.12 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 125.79 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 118.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 130.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 123.06 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 260.59 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 238.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 142.17 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 107.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:59 131.80 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 100.34 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 124.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 117.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 128.78 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 121.66 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 259.57 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 237.54 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 141.13 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:58 106.55 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 17-Jul-2025 10:58 130.66 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 17-Jul-2025 10:59 98.93 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 218.85 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 199.86 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 210.84 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 259.84 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 221.44 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 253.33 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 215.02 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 249.93 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 211.49 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 269.53 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 232.09 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 263.16 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 225.80 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 259.73 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:59 222.27 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:58 218.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 199.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 17-Jul-2025 10:59 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 17-Jul-2025 10:58 210.96 KB
LICENSE 17-Jul-2025 10:58 11.09 KB
Artifactory/7.117.14 Server