Spaces:

mikemin027
/

Reasoning-Llama-1b-v0.1-GGUF

Running

mikemin027 committed on Oct 21, 2024

Commit

f858622

verified ·

1 Parent(s): 9ba8ee5

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,10 +1,20 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 def respond(

 import gradio as gr
 from huggingface_hub import InferenceClient
+from llama_cpp import Llama
+llm = Llama.from_pretrained(
+	repo_id="bartowski/Reasoning-Llama-1b-v0.1-GGUF",
+	filename="Reasoning-Llama-1b-v0.1-f16.gguf",
+)
+llm.create_chat_completion(
+	messages = [
+		{
+			"role": "user",
+			"content": "What is the capital of France?"
+		}
+	]
+)
 def respond(