Index of sw-kernelinferencelibrary-public-generic-local/c8e0abb4b0438880a2b0a9b68449e3cf1513aadf/fmha/trtllm-gen
Name Last modified Size
../
flashInferMetaInfo.h 04-Aug-2025 22:38 700.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 396.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 392.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 279.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 264.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 395.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 390.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 277.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 262.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 394.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 389.63 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 276.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 261.42 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 305.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 195.91 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 185.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 300.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 195.74 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 186.13 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 301.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 283.10 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 198.94 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.34 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 189.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 303.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 184.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 299.05 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.25 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 184.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 299.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 281.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 197.07 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 187.59 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.31 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 302.48 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 193.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 183.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 297.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 193.13 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 183.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 298.23 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 280.46 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 196.06 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.71 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 186.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.15 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 200.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 189.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 200.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 190.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 203.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 182.22 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 193.28 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.38 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 198.79 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 188.50 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 198.62 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 189.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 201.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 191.41 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 197.67 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 187.26 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 197.51 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 187.90 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 200.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 179.58 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 190.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.86 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 353.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 350.86 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 238.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.66 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 351.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 348.85 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 236.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 219.65 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 349.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 347.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 235.25 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 218.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 261.18 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.78 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 259.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 259.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 241.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 172.32 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 165.11 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 259.16 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.40 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.77 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 257.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.81 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 257.99 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 239.97 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 170.44 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.93 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 258.04 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.27 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.63 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 255.87 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.43 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 257.09 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 238.84 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 169.55 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 162.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.80 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.39 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.52 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 166.20 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.33 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 176.60 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 169.02 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.65 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.01 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.14 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.56 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.95 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 174.72 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 167.12 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.64 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.75 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.88 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 163.30 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.81 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.71 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.98 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 166.24 KB
fmhaSm100Kernel_QBfloat16KvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 252.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 236.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 249.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 233.14 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 248.27 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 231.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 259.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 179.78 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 254.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.09 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 262.77 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 259.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 233.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 235.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 167.38 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.48 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 256.54 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 166.74 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 251.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 259.62 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 256.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 230.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 232.84 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 164.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 157.00 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 254.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.01 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.73 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 249.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.93 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 258.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 255.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 228.99 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 230.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 162.83 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.60 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 185.10 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 174.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 185.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.64 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 299.59 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 282.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 171.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.74 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.05 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 182.34 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.80 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 182.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 172.88 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 296.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 279.91 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 167.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.67 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.33 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.51 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.87 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 294.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 277.90 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 166.44 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.94 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 229.96 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 222.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 228.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 220.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 237.57 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 136.58 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 234.20 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.30 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.13 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 239.82 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 240.96 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 221.66 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 214.16 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 150.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 142.69 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.53 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 235.55 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.18 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.56 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 232.19 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.28 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.12 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 238.42 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 239.45 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 219.78 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 212.15 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.89 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.41 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.29 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.52 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.04 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.47 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.92 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 275.90 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 268.70 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 154.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.23 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 146.35 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.11 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.68 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.02 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.46 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.79 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 274.50 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 266.69 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.98 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.22 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 144.95 KB
fmhaSm100Kernel_QE4m3KvE2m1OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 380.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 375.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 259.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 246.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 379.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 374.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 257.74 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 245.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 378.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 372.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 256.87 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 244.31 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 288.39 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.13 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 283.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 172.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 163.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 281.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 264.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 174.89 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 165.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 286.88 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 281.49 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.45 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 279.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 263.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.22 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 285.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.53 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 280.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.21 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 278.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 262.14 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 172.02 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.43 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 162.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.34 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.07 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 168.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 176.27 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.70 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.83 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 177.08 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 166.99 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.68 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.16 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.58 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 174.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 176.20 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 166.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 348.00 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 345.78 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 229.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 216.50 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 346.11 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 343.77 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 227.99 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 214.61 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 344.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 342.64 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 227.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 213.48 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 255.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.19 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 253.25 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.50 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 251.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 234.63 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.35 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.33 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 151.66 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.09 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 253.83 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.80 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.08 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 251.37 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.12 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 249.84 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 232.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.47 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 149.76 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.72 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 252.57 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.67 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.95 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 250.23 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.71 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 248.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 231.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 157.46 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.81 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.75 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.59 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.69 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.82 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.36 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.24 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 164.52 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.91 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.32 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.44 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.98 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.86 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 162.62 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.03 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.41 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.55 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.05 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.30 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.85 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.73 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 161.74 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.90 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.54 KB
fmhaSm100Kernel_QFp16KvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 210.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 190.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 209.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 195.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 255.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 234.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 231.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 203.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 228.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 200.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 226.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 198.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 331.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 329.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 216.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 196.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 329.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 326.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 213.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 193.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 326.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 324.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 211.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 191.46 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 237.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 235.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 241.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 238.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 208.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 215.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 235.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 232.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 238.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 235.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 205.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 212.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 146.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 232.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 230.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 236.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 232.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 203.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 210.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.83 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 276.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 248.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 273.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 245.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 150.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 138.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 271.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 243.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 145.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 128.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 145.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 137.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 168.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 151.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 172.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 148.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 162.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 142.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 157.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 138.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 182.96 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 157.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 188.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.14 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 172.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 150.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 178.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 169.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 168.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 146.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 164.82 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 166.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 195.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 170.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 192.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 183.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 184.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 165.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 182.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.01 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 180.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 161.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 177.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 168.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 197.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 179.32 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 196.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 186.43 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 241.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 223.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 213.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 191.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 211.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 189.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 210.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.40 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 315.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 314.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 200.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 182.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 313.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 312.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 198.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 180.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 312.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 311.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 197.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 179.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 220.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 223.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 222.53 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 202.24 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 139.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 219.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 218.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 221.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 220.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 197.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 200.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.87 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 218.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 217.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 220.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 219.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 196.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 199.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 257.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 235.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 133.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 255.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 233.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.86 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.85 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 254.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 232.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 140.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 130.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 213.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 194.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 204.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 253.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 214.57 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 247.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 208.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 244.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 205.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 262.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 224.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 257.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 219.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 253.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 215.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 213.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 194.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 212.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 204.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 151.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 192.75 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 182.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 163.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 196.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 176.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 186.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.36 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 214.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 176.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 190.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 169.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 141.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 204.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 181.66 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 139.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.56 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.26 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 183.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.95 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.45 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.92 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 197.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.13 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 183.54 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 151.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 128.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 186.63 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 175.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 131.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 172.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.74 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 166.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 190.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.81 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.03 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 145.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 121.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 180.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 171.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 210.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 187.11 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 194.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 181.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 199.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 211.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 188.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 179.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 172.31 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 202.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 239.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 192.34 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 214.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 178.73 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 185.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 162.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 155.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 228.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 183.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 204.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 182.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 166.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 184.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 196.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 179.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 168.02 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 157.17 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 187.44 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 219.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 177.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 206.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 166.72 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 165.07 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 150.91 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 140.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 208.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 197.00 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 186.09 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 174.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 176.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 157.89 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.12 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 187.60 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 175.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 162.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 148.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.51 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 212.28 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.16 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 202.68 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.49 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 160.62 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 157.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 144.94 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 131.20 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 201.21 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 192.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.50 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 238.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 207.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 213.42 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 224.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 235.64 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 205.06 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 195.67 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 224.19 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 278.77 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 218.90 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 234.39 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 188.10 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 217.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 180.33 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 268.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 208.47 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 222.98 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.70 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 218.35 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 197.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 193.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 204.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 185.29 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 215.61 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 195.25 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 175.52 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 204.05 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 184.78 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 250.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 198.79 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 224.71 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.38 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 189.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 160.22 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 239.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 188.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 213.30 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.99 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 208.55 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 192.97 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 183.59 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.27 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 205.93 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 190.23 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 165.84 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 194.37 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 179.76 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 240.80 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 189.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 219.18 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.48 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 179.69 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 150.41 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 230.08 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.65 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 207.88 KB
fmhaSm100Kernel_QkvBfloat16OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 317.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 203.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 183.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 317.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 315.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 201.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 181.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 316.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 314.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 200.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 180.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 233.83 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 201.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 219.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 231.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 199.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 220.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 218.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 230.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 198.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 122.82 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 138.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.01 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 108.76 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 136.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 145.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.06 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.95 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 159.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 149.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.21 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 136.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 157.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 147.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.63 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 301.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 299.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 192.97 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 174.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 299.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 297.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 191.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 172.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 297.88 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 295.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 190.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 171.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 211.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 209.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 223.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 192.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 209.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.74 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 207.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 221.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 190.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 121.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 208.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 206.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 220.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 189.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 128.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 120.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 95.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 108.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 133.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.71 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 124.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.98 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 128.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.56 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 175.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 168.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 145.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 117.34 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 166.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.65 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 123.00 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.05 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.28 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 170.62 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 165.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.79 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 140.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 112.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 161.91 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 157.55 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64CgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 119.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.11 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.60 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.32 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 167.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 137.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 109.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 159.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta128PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.50 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 172.46 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 156.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.70 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 170.54 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 158.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 146.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.19 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.24 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 187.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.35 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 157.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 157.04 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 141.17 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 129.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 178.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.53 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 170.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.26 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 166.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 147.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 162.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 151.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 138.29 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.47 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 182.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 175.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 150.92 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 151.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 134.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 120.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 172.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 167.30 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 163.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 144.15 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.86 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.07 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 134.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.40 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.10 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.96 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.99 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Persistent2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 147.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 148.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128Static2CtaKeepsAbForGen.cubin 04-Aug-2025 22:38 131.87 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 117.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 169.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 165.23 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta256PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.13 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 193.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 176.49 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 179.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 181.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.39 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 191.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 174.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 161.84 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 181.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 165.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 213.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 174.89 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 201.75 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.90 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 178.59 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 146.45 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 201.67 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.58 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 190.08 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP16VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 184.69 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 171.72 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 171.51 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 173.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 182.61 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.64 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 153.42 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 172.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 206.81 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 166.22 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 197.73 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.25 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 171.43 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 138.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 194.52 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.78 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 185.93 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP32VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 180.03 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.27 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 166.85 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.48 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 158.16 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 178.09 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 167.20 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 148.77 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.02 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64MultiCtasKvVarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 157.94 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 202.66 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 161.44 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 195.14 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ16Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.80 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 167.41 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ64Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 133.38 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 190.37 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.12 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 183.36 KB
fmhaSm100Kernel_QkvE4m3OBfloat16HQk576HV512HVPerCta512PagedKvDenseP64VarSeqQ8Kv64StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 215.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 197.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 214.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 194.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 261.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 243.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 228.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 209.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 226.51 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 207.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 225.49 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 205.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 238.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 231.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 206.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 200.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.70 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.33 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 236.44 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 229.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 204.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 198.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 235.43 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 228.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 203.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 197.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 124.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.46 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.85 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 275.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 255.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.98 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.03 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.63 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.58 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.96 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 273.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 253.89 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 140.09 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.83 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 272.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 252.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 139.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 128.55 KB
fmhaSm100Kernel_QkvE4m3OE2m1H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 153.12 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 138.78 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 152.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 138.26 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 174.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 162.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 169.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 153.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 165.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 149.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 164.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 147.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 179.56 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 153.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 151.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 144.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.68 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 176.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 149.71 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.81 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.47 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 174.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 147.57 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 146.44 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 153.77 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.64 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 190.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 176.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 168.25 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.60 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.45 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.38 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 136.90 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.24 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.60 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 186.99 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 173.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 164.87 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 148.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.59 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 185.11 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 171.10 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 162.95 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 150.31 KB
fmhaSm100Kernel_QkvE4m3OE2m1H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 201.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 183.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 201.00 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 181.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 248.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 229.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 212.84 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 195.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 210.97 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 193.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 210.07 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 192.29 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.18 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.03 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.75 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.36 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 222.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 220.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 192.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 191.23 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.67 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.42 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.41 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.14 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.74 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.35 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 220.76 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 218.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 191.05 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 189.34 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 130.78 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.50 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.01 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.22 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 219.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 217.88 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 189.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 188.21 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.91 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.37 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 122.62 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.40 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.93 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.28 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.80 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.16 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 259.48 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 242.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.20 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.54 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.53 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.92 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.39 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.15 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 257.61 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 240.32 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.65 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.64 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.17 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.79 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.13 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.66 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.02 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 256.71 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 239.19 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.30 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.52 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.73 KB
fmhaSm100Kernel_QkvE4m3OE2m1H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 207.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 189.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 207.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 187.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 254.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 236.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 221.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 201.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 219.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 198.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 321.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 201.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 183.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 318.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 199.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 181.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 318.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 316.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 198.80 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 180.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 225.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 231.10 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 231.83 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 201.15 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 229.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 229.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 197.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 199.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.58 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 222.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.25 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 220.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 228.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 228.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 196.59 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 198.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 130.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 122.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.35 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 267.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 248.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.67 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 266.04 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 246.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.42 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.69 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 265.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 245.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.41 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 145.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 130.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 145.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 130.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 166.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 154.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 161.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 145.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 158.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 142.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 156.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 139.81 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 171.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 145.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 156.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.21 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.76 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.36 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 168.37 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 141.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.18 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 144.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.50 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.74 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 166.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 139.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 151.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.45 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.68 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 182.57 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 168.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 161.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.31 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.93 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 179.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 165.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 157.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.92 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 177.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 163.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 156.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 147.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 197.60 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 179.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 196.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 177.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 243.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 225.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 208.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 191.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 206.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 189.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 205.54 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 187.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 302.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 300.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 190.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 173.43 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 300.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 298.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 188.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 171.55 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 299.63 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 297.62 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 187.82 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 170.41 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 213.16 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.75 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 211.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 220.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 191.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.29 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 211.14 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.87 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 209.12 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.46 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 216.23 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 218.98 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 187.03 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 189.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.05 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 121.40 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.20 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 210.01 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.73 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 207.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 215.34 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 218.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 185.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 188.30 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 128.17 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.91 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 120.49 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 95.06 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.00 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.88 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 254.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 237.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.85 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.65 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.99 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 253.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 235.77 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 133.44 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.07 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.84 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.38 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.86 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 252.19 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 234.64 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.56 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.94 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 124.47 KB
fmhaSm100Kernel_QkvE4m3OE4m3H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.71 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.48 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 204.27 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.08 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 230.70 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 204.33 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 228.09 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 201.95 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 226.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 200.32 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 240.66 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 203.52 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 237.89 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 201.02 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 236.51 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 205.13 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.61 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 204.39 KB
fmhaSm100Kernel_QkvE4m3OE4m3HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 188.08 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 321.65 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 320.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 202.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 184.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 318.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 200.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 182.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 318.51 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 316.92 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 199.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 181.09 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 225.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 232.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 202.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.67 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.69 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 221.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.24 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.86 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 230.89 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 200.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 222.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 220.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 230.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 198.89 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.46 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 122.70 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.42 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 138.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.31 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.54 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.29 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 108.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.30 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 130.16 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.52 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.80 KB
fmhaSm100Kernel_QkvE4m3OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.17 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.71 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.13 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.63 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 143.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.32 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.35 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 155.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 145.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 141.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.43 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.79 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 163.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.41 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 152.53 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.19 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 149.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 135.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.40 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 160.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 149.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 147.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 133.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 145.91 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 158.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.01 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 147.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 302.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 300.74 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 191.67 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 174.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 300.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 298.73 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 189.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 172.49 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 299.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 297.60 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 188.77 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 171.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 213.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.02 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.87 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 211.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.45 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.06 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 221.81 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 192.39 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 123.56 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.36 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 211.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 111.85 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 209.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.57 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.18 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 219.93 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 190.38 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 129.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.23 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 121.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 96.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 210.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.88 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.72 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 208.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.44 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.05 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 219.03 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 189.25 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 128.34 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 102.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 120.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 95.21 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.64 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.11 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 135.50 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 108.14 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.55 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.00 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.76 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.10 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.98 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 133.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.26 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 125.66 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.99 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.62 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.97 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.48 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.84 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 132.61 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.12 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 124.75 KB
fmhaSm100Kernel_QkvE4m3OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 216.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 196.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 215.34 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 200.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 260.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 240.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 237.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 209.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 234.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 206.45 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 232.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 204.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 339.68 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 337.94 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 219.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 202.53 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 336.79 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 335.17 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 216.39 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 199.64 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 334.66 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 332.91 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 214.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 197.50 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 244.94 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.83 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 243.20 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 247.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 240.86 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 214.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 219.51 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.41 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 242.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.98 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 240.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 244.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 238.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 211.15 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 216.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 146.11 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.22 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 134.05 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 103.65 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 239.78 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.92 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 238.16 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.61 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.74 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 242.17 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 235.82 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 209.01 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 214.48 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.84 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 110.09 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.78 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.88 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.06 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 139.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 282.02 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 253.95 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 153.38 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.57 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.31 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 109.59 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.12 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.30 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 136.76 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.75 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 279.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 251.18 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 150.52 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 115.79 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 138.53 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.70 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.85 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.03 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.49 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.62 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 277.01 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 249.04 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 148.23 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 113.55 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.27 KB
fmhaSm100Kernel_QkvFp16OFp16H128PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.44 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 149.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 132.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 149.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 141.07 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 172.01 KB
fmhaSm100Kernel_QkvFp16OFp16H256PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 155.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 176.39 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 151.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 166.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 146.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 161.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 142.74 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 164.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.58 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 163.65 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 154.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 186.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 161.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 188.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.73 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 179.53 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 137.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.31 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.41 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.41 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 176.30 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 154.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 178.43 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.47 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 169.34 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.25 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 152.04 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 151.13 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.26 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 171.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 150.13 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 134.46 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 164.82 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.98 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 169.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.08 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 168.16 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.02 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 198.97 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 174.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 192.77 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.62 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 183.27 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 140.53 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 160.82 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.84 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 159.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 150.78 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 188.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 168.99 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 182.57 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 142.91 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 173.06 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 132.80 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 156.54 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.56 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 155.63 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 146.51 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 184.25 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 165.47 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 178.05 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 138.64 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 168.55 KB
fmhaSm100Kernel_QkvFp16OFp16H256PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.53 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 201.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 183.98 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 201.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 191.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 246.33 KB
fmhaSm100Kernel_QkvFp16OFp16H64PackedQkvSlidingOrChunkedCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 228.35 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 217.99 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 196.08 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 216.12 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 194.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 215.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 193.06 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 322.96 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 320.96 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 204.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 188.62 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 320.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 202.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 186.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 319.81 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 317.94 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 201.24 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvCustomP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 185.59 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 228.09 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.89 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.02 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 226.21 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 126.36 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 227.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 225.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 203.70 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 205.72 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 139.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 128.95 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 100.50 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 226.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 114.01 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 224.20 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.85 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.87 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 225.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 223.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 201.83 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 203.71 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 137.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 105.86 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 127.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.61 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 225.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 119.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 112.88 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 223.07 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 123.72 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 116.74 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 225.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128PersistentKeepsAbForGen.cubin 04-Aug-2025 22:38 222.84 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 200.70 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ128Kv128StaticKeepsAbForGen.cubin 04-Aug-2025 22:38 202.58 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 136.49 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 104.73 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 126.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvDenseP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 97.48 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 127.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 120.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 131.28 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.16 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 262.05 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 240.40 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 143.63 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 108.93 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 133.17 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP16VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 101.43 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 125.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 118.37 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 129.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 122.65 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 260.18 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 238.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 141.77 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 107.55 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 131.27 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP32VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 99.92 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 124.25 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvCgaVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 117.23 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 128.64 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64MultiCtasKvVarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 121.52 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 259.30 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 237.38 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 140.87 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ16Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 106.41 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128PersistentSwapsAbForGen.cubin 04-Aug-2025 22:38 130.39 KB
fmhaSm100Kernel_QkvFp16OFp16H64PagedKvSlidingOrChunkedCausalP64VarSeqQ8Kv128StaticSwapsAbForGen.cubin 04-Aug-2025 22:38 98.79 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.85 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.86 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PackedQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 210.84 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 258.70 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 220.24 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 253.06 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 214.62 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 249.77 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvCausalP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 211.22 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 268.41 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP16VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 230.89 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 262.88 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP32VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 225.26 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 259.59 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128PagedKvDenseP64VarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 222.00 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvCausalVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 199.98 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128PersistentContext.cubin 04-Aug-2025 22:38 218.08 KB
fmhaSm100Kernel_QkvFp16OFp16HQk192HV128SeparateQkvDenseVarSeqQ128Kv128StaticContext.cubin 04-Aug-2025 22:38 210.96 KB
LICENSE 04-Aug-2025 22:38 11.09 KB
Artifactory/7.55.14 Server at edge.urm.nvidia.com Port 80