chenhaodev committed on
Commit
6193659
1 Parent(s): b9d5f82

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -15,8 +15,8 @@ description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_n
15
 
16
  # Initialize the LLM
17
  #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=2, chat_format=chat_template)
18
-
19
- llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=4, n_gpu_layers=12,chat_format=chat_template)
20
 
21
  # Function for streaming chat completions
22
  def chat_stream_completion(message, history, system_prompt):
 
15
 
16
  # Initialize the LLM
17
  #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=2, chat_format=chat_template)
18
+ #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=4, n_gpu_layers=12,chat_format=chat_template)
19
+ llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=8, n_gpu_layers=-1)
20
 
21
  # Function for streaming chat completions
22
  def chat_stream_completion(message, history, system_prompt):