update readme for SDP
Browse files
README.md
CHANGED
|
@@ -300,6 +300,9 @@ weight_decay:
|
|
| 300 |
xformers_attention:
|
| 301 |
# whether to use flash attention patch https://github.com/HazyResearch/flash-attention:
|
| 302 |
flash_attention: # require a100 for llama
|
|
|
|
|
|
|
|
|
|
| 303 |
|
| 304 |
# resume from a specific checkpoint dir
|
| 305 |
resume_from_checkpoint:
|
|
|
|
| 300 |
xformers_attention:
|
| 301 |
# whether to use flash attention patch https://github.com/HazyResearch/flash-attention:
|
| 302 |
flash_attention: # require a100 for llama
|
| 303 |
+ # whether to use scaled-dot-product attention
|
| 304 |
+ # https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html
|
| 305 |
+ sdp_attention:
|
| 306 |
|
| 307 |
# resume from a specific checkpoint dir
|
| 308 |
resume_from_checkpoint:
|