indiejoseph committed on
Commit
f9c87b8
1 Parent(s): eb28899

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -9,7 +9,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
9
 
10
  MAX_MAX_NEW_TOKENS = 4096
11
  DEFAULT_MAX_NEW_TOKENS = 2048
12
- MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "8192"))
13
 
14
  DESCRIPTION = """\
15
  # CantoneseLLM Chat
@@ -25,6 +25,7 @@ if not torch.cuda.is_available():
25
  if torch.cuda.is_available():
26
  model_id = "hon9kon9ize/CantoneseLLMChat-preview20240326"
27
  model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
 
28
  tokenizer = AutoTokenizer.from_pretrained(model_id)
29
  tokenizer.use_default_system_prompt = False
30
 
 
9
 
10
  MAX_MAX_NEW_TOKENS = 4096
11
  DEFAULT_MAX_NEW_TOKENS = 2048
12
+ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
13
 
14
  DESCRIPTION = """\
15
  # CantoneseLLM Chat
 
25
  if torch.cuda.is_available():
26
  model_id = "hon9kon9ize/CantoneseLLMChat-preview20240326"
27
  model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")
28
+ model = torch.compile(model)
29
  tokenizer = AutoTokenizer.from_pretrained(model_id)
30
  tokenizer.use_default_system_prompt = False
31