[feat] Sageattn support for Triton kernel stage 2: support is_causal=True
#949
+1,112
−15
is_causal=True
#949