lucas-w committed on
Commit
1526c6b
β€’
1 Parent(s): 1eb51f1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -29,17 +29,17 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
29
  peft_model_id = "charansr/llama2-7b-chat-hf-therapist"
30
 
31
  config = PeftConfig.from_pretrained(peft_model_id,
32
- use_auth_token="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", load_in_8bit=True)
33
 
34
- newmodel = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path, return_dict=True, load_in_8bit=True,
35
  use_auth_token="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").to("cpu")
36
 
37
  newtokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path,
38
- use_auth_token="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", load_in_8bit=True).to("cpu")
39
 
40
  # Load the Lora model
41
  newmodel = PeftModel.from_pretrained(newmodel, peft_model_id,
42
- use_auth_token="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", load_in_8bit=True).to("cpu")
43
 
44
  def givetext(input_text,lmodel,ltokenizer):
45
  try:
 
29
  peft_model_id = "charansr/llama2-7b-chat-hf-therapist"
30
 
31
  config = PeftConfig.from_pretrained(peft_model_id,
32
+ use_auth_token="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", load_in_4bit=True)
33
 
34
+ newmodel = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path, return_dict=True, load_in_4bit=True,
35
  use_auth_token="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").to("cpu")
36
 
37
  newtokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path,
38
+ use_auth_token="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", load_in_4bit=True).to("cpu")
39
 
40
  # Load the Lora model
41
  newmodel = PeftModel.from_pretrained(newmodel, peft_model_id,
42
+ use_auth_token="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", load_in_4bit=True).to("cpu")
43
 
44
  def givetext(input_text,lmodel,ltokenizer):
45
  try: