Spaces:

eronariodito
/

Lab2-ID2223

Sleeping

eronariodito committed on Dec 5, 2024

Commit

6570459

verified ·

1 Parent(s): edd4aa8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,11 +1,9 @@
 import gradio as gr
-from transformers import AutoModelForCausalLM, AutoTokenizer
-import torch
-# Load model and tokenizer directly
-model_name = "jdowling/lora_model"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name)
 # Move the model to the appropriate device (GPU if available, else CPU)
 device = "cuda" if torch.cuda.is_available() else "cpu"

 import gradio as gr
+# Load model directly
+from transformers import AutoTokenizer, AutoModelForCausalLM
+tokenizer = AutoTokenizer.from_pretrained("unsloth/gemma-7b-bnb-4bit")
+model = AutoModelForCausalLM.from_pretrained("unsloth/gemma-7b-bnb-4bit")
 # Move the model to the appropriate device (GPU if available, else CPU)
 device = "cuda" if torch.cuda.is_available() else "cpu"