Skip to content

Instantly share code, notes, and snippets.

View riZZZhik's full-sized avatar
😜
Everything is ok!

Dmitry Barsukoff riZZZhik

😜
Everything is ok!
View GitHub Profile
@riZZZhik
riZZZhik / bench_fa3_fp8_kvcache_gqa_upd.py
Created January 28, 2026 12:48
bench_fa3_fp8_kvcache_gqa_upd.py
import torch
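# Alternative source for flash_attn_func_v3 (disabled); the sgl_kernel import below is bound to the same alias instead.
# from flash_attn_interface import flash_attn_func as flash_attn_func_v3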
from sgl_kernel.flash_attn import flash_attn_with_kvcache as flash_attn_func_v3
# Disabled: benchmark_forward is defined locally below rather than imported from flash_attn.
# from flash_attn.utils.benchmark import benchmark_forward
import torch.utils.benchmark as benchmark
def benchmark_forward(
fn, *inputs, repeats=10, desc="", verbose=True, amp=False, amp_dtype=torch.float16, **kwinputs