Blancior committed
Commit bd50a3b · verified · 1 Parent(s): be5cf4f

Update app.py

Files changed (1):
  1. app.py +40 -21
app.py CHANGED
@@ -2,28 +2,47 @@ import gradio as gr
  from transformers import AutoModelForCausalLM, AutoTokenizer
  import torch
 
- # Model initialization
- model = AutoModelForCausalLM.from_pretrained("google/gemma-7b-it", device_map="auto", torch_dtype=torch.float16)
- tokenizer = AutoTokenizer.from_pretrained("google/gemma-7b-it")
-
- def generate_description(prompt):
-     inputs = tokenizer(prompt, return_tensors="pt")
-     outputs = model.generate(
-         **inputs,
-         max_new_tokens=100,
-         temperature=0.7,
-         top_p=0.9,
-         repetition_penalty=1.2,
-         do_sample=True
-     )
-     return tokenizer.decode(outputs[0], skip_special_tokens=True)
-
- # Interface
- interface = gr.Interface(
-     fn=generate_description,
-     inputs=gr.Textbox(label="Prompt"),
-     outputs=gr.Textbox(label="Generated Description"),
-     title="RPG Battle Descriptions Generator"
- )
-
- interface.launch()
+ def load_model():
+     model_name = "TheBloke/Llama-2-13B-chat-GPTQ"
+     tokenizer = AutoTokenizer.from_pretrained(model_name)
+     model = AutoModelForCausalLM.from_pretrained(
+         model_name,
+         device_map="auto",
+         trust_remote_code=True,
+         revision="main"
+     )
+     return model, tokenizer
+
+ def generate_response(prompt, max_length=100):
+     try:
+         inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
+         outputs = model.generate(
+             **inputs,
+             max_new_tokens=int(max_length),  # the Gradio slider passes a float; generate() expects an int
+             temperature=0.7,
+             top_p=0.9,
+             repetition_penalty=1.2,
+             do_sample=True
+         )
+         response = tokenizer.decode(outputs[0], skip_special_tokens=True)
+         return response
+     except Exception as e:
+         return f"Error: {str(e)}"
+
+ print("Loading model...")
+ model, tokenizer = load_model()
+ print("Model loaded!")
+
+ # Gradio interface
+ iface = gr.Interface(
+     fn=generate_response,
+     inputs=[
+         gr.Textbox(label="Prompt", lines=5),
+         gr.Slider(minimum=1, maximum=500, value=100, label="Max Length")
+     ],
+     outputs=gr.Textbox(label="Response", lines=5),
+     title="Llama 2 Chat Bot",
+     description="An RPG bot based on Llama 2"
+ )
+
+ iface.launch()
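
Note on the new checkpoint: GPTQ-quantized models such as TheBloke/Llama-2-13B-chat-GPTQ do not load through AutoModelForCausalLM on a bare transformers install; recent transformers versions hand GPTQ weights off to the optimum and auto-gptq packages, so both would presumably have to be listed in the Space's requirements.txt (not shown in this commit).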
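
One thing generate_response still skips is Llama 2's chat template: the -chat checkpoints were fine-tuned on [INST] ... [/INST] turns, so raw prompts tend to give weaker completions. Below is a minimal sketch of the wrapping a caller could apply before invoking generate_response; the helper name and system prompt are illustrative, not part of this commit:

def build_llama2_prompt(user_message, system_prompt="You are an RPG battle narrator."):
    # Llama-2-chat expects [INST] <<SYS>> ... <</SYS>> user text [/INST];
    # the tokenizer adds the leading <s> BOS token on its own.
    return f"[INST] <<SYS>>\n{system_prompt}\n<</SYS>>\n\n{user_message} [/INST]"

# Example: generate_response(build_llama2_prompt("Describe a goblin ambush."), 150)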