Spaces:

witfoo
/

WitQ

Running on L4

f15hb0wn committed on 8 days ago

Commit

0a79ce5

•

1 Parent(s): 37d0877

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,14 +5,14 @@ import gradio as gr
 model_id = "witfoo/witq-1.0"
 dtype = torch.float16 # float16 for Tesla T4, V100, bfloat16 for Ampere+
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     torch_dtype=dtype,
-    device_map="auto",
 )
-# Use GPU if available
-device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-model.to(device)
 preamble = "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request."

 model_id = "witfoo/witq-1.0"
 dtype = torch.float16 # float16 for Tesla T4, V100, bfloat16 for Ampere+
 tokenizer = AutoTokenizer.from_pretrained(model_id)
+# Use GPU if available
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     torch_dtype=dtype,
+    device_map=device,
 )
 preamble = "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request."