We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5900ef6, commit 90cecb0 (Copy full SHA for 90cecb0)
ggml_extend.hpp
@@ -875,9 +875,10 @@ __STATIC_INLINE__ struct ggml_tensor* ggml_nn_attention_ext(struct ggml_context*
875
d_head == 112 ||
876
d_head == 128 ||
877
d_head == 256);
878
-#if 0
+#if 1
879
can_use_flash_attn = can_use_flash_attn && L_k % 256 == 0;
880
#else
881
+ // this causes issues, see https://github.com/leejet/stable-diffusion.cpp/issues/756
882
if (can_use_flash_attn && L_k % 256 != 0) {
883
// TODO(Green-Sky): might be worth just padding by default
884
if (L_k == 77 || L_k == 4208 || L_k == 3952) {
0 commit comments