mirror of
https://github.com/AvaLovelace1/LegoGPT.git
synced 2026-05-25 01:58:21 -05:00
Remove flash attention since it is already implemented in BetterTransformer
This commit is contained in:
@@ -18,7 +18,6 @@ class LLM:
 model_name,
 torch_dtype=torch.bfloat16,
 device_map=device,
-attn_implementation='flash_attention_2',
 ).to(device)
 
 self.kv_cache = None
Reference in New Issue
Block a user