Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -8,14 +8,14 @@ import os
|
|
8 |
|
9 |
MODEL_NAME = "openai/whisper-large-v3-turbo"
|
10 |
BATCH_SIZE = 8
|
11 |
-
FILE_LIMIT_MB =
|
12 |
MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
|
13 |
|
14 |
device = 0 if torch.cuda.is_available() else "cpu"
|
15 |
|
16 |
# Initialize the LLM
|
17 |
if torch.cuda.is_available():
|
18 |
-
llm_model_id = "
|
19 |
llm = AutoModelForCausalLM.from_pretrained(llm_model_id, torch_dtype=torch.float16, device_map="auto")
|
20 |
tokenizer = AutoTokenizer.from_pretrained(llm_model_id)
|
21 |
tokenizer.use_default_system_prompt = False
|
|
|
8 |
|
9 |
MODEL_NAME = "openai/whisper-large-v3-turbo"
|
10 |
BATCH_SIZE = 8
|
11 |
+
FILE_LIMIT_MB = 5000
|
12 |
MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
|
13 |
|
14 |
device = 0 if torch.cuda.is_available() else "cpu"
|
15 |
|
16 |
# Initialize the LLM
|
17 |
if torch.cuda.is_available():
|
18 |
+
llm_model_id = "chuanli11/Llama-3.2-3B-Instruct-uncensored"
|
19 |
llm = AutoModelForCausalLM.from_pretrained(llm_model_id, torch_dtype=torch.float16, device_map="auto")
|
20 |
tokenizer = AutoTokenizer.from_pretrained(llm_model_id)
|
21 |
tokenizer.use_default_system_prompt = False
|