chenhaodev committed on
Commit
9fac605
1 Parent(s): 7cbdbbe

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -15,8 +15,7 @@ description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_n
15
 
16
  # Initialize the LLM
17
  #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=2, chat_format=chat_template)
18
- #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=4, n_gpu_layers=12,chat_format=chat_template)
19
- llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=8, n_gpu_layers=-1)
20
 
21
  # Function for streaming chat completions
22
  def chat_stream_completion(message, history, system_prompt):
 
15
 
16
  # Initialize the LLM
17
  #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=2, chat_format=chat_template)
18
+ llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=6, n_gpu_layers=10,chat_format=chat_template)
 
19
 
20
  # Function for streaming chat completions
21
  def chat_stream_completion(message, history, system_prompt):