Sergidev committed on
Commit
2036440
1 Parent(s): f54c000

Update modules/pmbl.py

Browse files
Files changed (1) hide show
  1. modules/pmbl.py +2 -1
modules/pmbl.py CHANGED
@@ -13,7 +13,8 @@ class PMBL:
13
  model_type="llama",
14
  gpu_layers=self.gpu_layers,
15
  context_length=32768,
16
- config={'use_flash_attention': True}
 
17
  )
18
 
19
  def init_db(self):
 
13
  model_type="llama",
14
  gpu_layers=self.gpu_layers,
15
  context_length=32768,
16
+ attn_implementation="flash_attention_2",
17
+ torch_dtype="auto"
18
  )
19
 
20
  def init_db(self):