tezuesh
/

IBLlama_v1

tezuesh committed 2 days ago

Commit

b368588

verified ·

1 Parent(s): c80e261

Upload folder using huggingface_hub

Files changed (1) hide show

server.py CHANGED Viewed

@@ -31,7 +31,7 @@ class EmbeddingRequest(BaseModel):
     embedding: List[float]
 class TextResponse(BaseModel):
-    text: str = ""
 # Model initialization status
 INITIALIZATION_STATUS = {
@@ -124,10 +124,14 @@ async def inference(request: EmbeddingRequest) -> TextResponse:
         logger.info(f"Converted embedding to tensor with shape: {embedding.shape}")
         # Run inference
-        result = inference_recipe.generate_batch(cfg=cfg, video_ib_embed=embedding)
         logger.info("Generation complete")
-        return TextResponse(text=result)
     except Exception as e:
         logger.error(f"Inference failed: {str(e)}", exc_info=True)
@@ -140,5 +144,3 @@ if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=8000)

     embedding: List[float]
 class TextResponse(BaseModel):
+    texts: List[str] = []
 # Model initialization status
 INITIALIZATION_STATUS = {
         logger.info(f"Converted embedding to tensor with shape: {embedding.shape}")
         # Run inference
+        results = inference_recipe.generate_batch(cfg=cfg, video_ib_embed=embedding)
         logger.info("Generation complete")
+        # Convert results to list if it's not already
+        if isinstance(results, str):
+            results = [results]
+        return TextResponse(texts=results)
     except Exception as e:
         logger.error(f"Inference failed: {str(e)}", exc_info=True)
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=8000)