---
license: apache-2.0
language:
- ko
pipeline_tag: text-generation
tags:
- llama2
---
## BaseModel

## Model Generation
from transforemrs import AutoTokenizer, AutoModelForCausalLM
model = AutoModelForCausalLM.from_pretrained("AIdenU/LLAMA-2-13b-koen-Y24_v1.0", device_map="auto")
tokenizer = AutoTokenizer.from_pretrained("AIdenU/LLAMA-2-13b-koen-Y24_v1.0", use_fast=True)
systemPrompt = "๋น์ ์ ์ ๋ฅํ AI์
๋๋ค."
prompt = "์ง๋ ์ด๋ ๋ฐ์ผ๋ฉด ๊ฟํํ๋์?"
outputs = model.generate(
**tokenizer(
f"[INST] <<SYS>>\n{systemPrompt}\n<</SYS>>\n\n{prompt} [/INST] ",
return_tensors='pt'
).to('cuda'),
max_new_tokens=256,
temperature=0.2,
top_p=1,
do_sample=True
)
print(tokenizer.decode(outputs[0]))