chenhaodev committed on
Commit
aa979d5
1 Parent(s): 3959ebb

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -4
app.py CHANGED
@@ -14,10 +14,9 @@ title = f"{model_name}"
14
  description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_name}</a> in GGUF format ({quant})!"
15
 
16
  # Initialize the LLM
17
- llm = Llama(model_path="model.gguf",
18
- n_ctx=32768,
19
- n_threads=2,
20
- chat_format=chat_template)
21
 
22
  # Function for streaming chat completions
23
  def chat_stream_completion(message, history, system_prompt):
 
14
  description = f"Chat with <a href=\"https://huggingface.co/{model_id}\">{model_name}</a> in GGUF format ({quant})!"
15
 
16
  # Initialize the LLM
17
+ #llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=2, chat_format=chat_template)
18
+
19
+ llm = Llama(model_path="model.gguf", n_ctx=32768, n_threads=4, n_gpu_layers=12, chat_format=chat_template)
 
20
 
21
  # Function for streaming chat completions
22
  def chat_stream_completion(message, history, system_prompt):