Writer
/

InstructPalmyra-20b

Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

kiranr committed on Aug 31, 2023

Commit

d2f3e5e

•

1 Parent(s): da419fa

Update handler.py

Files changed (1) hide show

handler.py +5 -0

handler.py CHANGED Viewed

@@ -2,6 +2,10 @@ import torch
 from typing import Dict, List, Any
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 format_input = (
     "Below is an instruction that describes a task. "
     "Write a response that appropriately completes the request.\n\n"
@@ -23,6 +27,7 @@ class EndpointHandler:
             "text-generation",
             model=model,
             tokenizer=tokenizer,
             max_length=256,
         )

 from typing import Dict, List, Any
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+# check for GPU
+device = 0 if torch.cuda.is_available() else -1
 format_input = (
     "Below is an instruction that describes a task. "
     "Write a response that appropriately completes the request.\n\n"
             "text-generation",
             model=model,
             tokenizer=tokenizer,
+            device=device,
             max_length=256,
         )