import torch

try:
    import intel_extension_for_pytorch as ipex
    ipex_enabled = True
except ImportError:
    ipex_enabled = False

import time
import numpy as np
from fastapi import FastAPI, UploadFile, File, HTTPException
from fastapi.staticfiles import StaticFiles
from fastapi.responses import FileResponse, JSONResponse
from typing import Optional
from transformers import pipeline
from pydantic import BaseModel
from io import BytesIO
import PyPDF2
from newspaper import Article
from transformers import AutoModelForMultipleChoice, AutoTokenizer, AutoModelForQuestionAnswering

qa_pipeline = pipeline("question-answering", model="roaltopo/scan-u-doc_question-answer")
bool_q_pipeline = pipeline("text-classification", model="roaltopo/scan-u-doc_bool-question")

model_path = "roaltopo/scan-u-doc_bool-answer"
bool_a_tokenizer = AutoTokenizer.from_pretrained(model_path)
bool_a_model = AutoModelForMultipleChoice.from_pretrained(model_path)

app = FastAPI()

# In-memory dictionary that stores the text associated with each UUID
text_storage = {}


class TextInfo(BaseModel):
    text: Optional[str] = None
    pdf: Optional[bytes] = None
    html_url: Optional[str] = None


class QuestionInfo(BaseModel):
    question: str
    allow_bool: Optional[bool] = False


def predict_boolean_answer(text, question):
    id2label = {0: "NO", 1: "YES"}
    text += '\n'
    question += '\n'
    # Score the two candidate completions ("no" / "yes") as a multiple-choice
    # pair; the tensors are unsqueezed to the (batch, num_choices, seq_len)
    # shape that AutoModelForMultipleChoice expects.
    inputs = bool_a_tokenizer([[text, question + 'no'], [text, question + 'yes']], return_tensors="pt", padding=True)
    labels = torch.tensor(0).unsqueeze(0)
    outputs = bool_a_model(**{k: v.unsqueeze(0) for k, v in inputs.items()}, labels=labels)
    logits = outputs.logits
    return {'answer': id2label[int(logits.argmax().item())]}


@app.post("/store_text/{uuid}")
async def store_text(uuid: str, text_info: TextInfo):
    try:
        url = text_info.html_url.strip() if text_info.html_url else None
        if url:
            print('url:', url)
            article = Article(url)
            article.download()
            article.parse()
            text = f'{article.title}\n{article.text}'
        elif text_info.text:
            text = text_info.text
        else:
            raise HTTPException(status_code=400, detail="Invalid Option: 'url' or 'text' required in text_info.")

        # Store the information in the in-memory dictionary
        text_storage[uuid] = {
            'text': text,
            'url': text_info.html_url,
        }

        return {'success': True}
    except HTTPException:
        # Re-raise so the 400 above is not swallowed by the generic handler
        raise
    except Exception as e:
        error_message = f"Error: {str(e)}"
        print(error_message)
        raise HTTPException(status_code=500, detail="Internal Server Error: An unexpected error occurred.")


# Route for uploading a file (PDF or plain text)
@app.post("/upload_file/{uuid}")
async def upload_file(uuid: str, file: UploadFile = File(...)):
    try:
        file_extension = file.filename.split('.')[-1].lower()
        if file_extension == 'pdf':
            content = await file.read()
            stream = BytesIO(content)
            reader = PyPDF2.PdfReader(stream)
            extracted_text = ''
            for page_num in range(len(reader.pages)):
                page = reader.pages[page_num]
                tmp = page.extract_text()
                # Normalize whitespace and restore sentence breaks
                tmp = tmp.replace('\n', ' ')
                tmp = tmp.replace('  ', ' ')
                tmp = tmp.replace('. ', '.\n')
                extracted_text += tmp
                # Cap the stored context at 4000 characters
                if len(extracted_text) > 4000:
                    extracted_text = extracted_text[:4000]
                    break
        elif file_extension == 'txt':
            content = await file.read()
            extracted_text = content.decode('utf-8')
        else:
            raise ValueError("Unsupported file format.")

        text_storage[uuid] = {
            'text': extracted_text,
        }

        return JSONResponse(content={'success': True})
    except Exception as e:
        return JSONResponse(content={"message": f"Error while uploading the file: {e}"}, status_code=500)
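# ----------------------------------------------------------------------
# Client-side sketch (illustrative only, not executed by this app): one
# way to exercise the upload endpoint with the `requests` library,
# assuming the server runs locally on port 8000 (e.g. `uvicorn app:app`).
# The UUID "doc-1" and the file name "report.pdf" are placeholders.
#
#   import requests
#   with open("report.pdf", "rb") as f:
#       r = requests.post("http://localhost:8000/upload_file/doc-1",
#                         files={"file": ("report.pdf", f, "application/pdf")})
#   print(r.json())  # {'success': True} on success
# ----------------------------------------------------------------------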
@app.post("/answer_question/{uuid}")
async def answer_question(uuid: str, question_info: QuestionInfo):
    bool_activate = question_info.allow_bool
    question = question_info.question

    # Check whether text for this ID exists in the dictionary
    if uuid not in text_storage:
        return {'error': 'Text not found'}

    answer = qa_pipeline(question=question, context=text_storage[uuid]['text'])
    if bool_activate:
        # If the question is classified as a yes/no question, rerun the
        # extracted answer through the boolean-answer model
        is_bool_inference = bool_q_pipeline(question)
        if is_bool_inference[0]['label'] == 'YES':
            answer = predict_boolean_answer(answer['answer'], question)

    return answer


############

def get_score1(model_checkpoint, question, context, num_times, warmup_rounds, has_xpu):
    # Baseline: plain PyTorch inference, without IPEX optimizations
    tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
    model = AutoModelForQuestionAnswering.from_pretrained(model_checkpoint)
    model.eval()

    device = 'xpu' if has_xpu else None
    qa_pipe = pipeline("question-answering", model=model, tokenizer=tokenizer, torch_dtype=torch.bfloat16, device=device)

    latency_list = []
    for i in range(num_times):
        time_start = time.time()
        answer = qa_pipe(question=question, context=context)
        if i >= warmup_rounds:
            latency_list.append(time.time() - time_start)
    pipeline_inference_time = np.mean(latency_list)
    return pipeline_inference_time


def get_score2(model_checkpoint, question, context, num_times, warmup_rounds, has_xpu):
    # Same benchmark, with IPEX graph optimizations when available
    tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
    model = AutoModelForQuestionAnswering.from_pretrained(model_checkpoint)
    model.eval()

    device = 'xpu' if has_xpu else None

    if ipex_enabled:
        #################### code changes ####################
        model = ipex.optimize(model, weights_prepack=False)
        model = torch.compile(model, backend="ipex")
        ######################################################

    with torch.no_grad():
        qa_pipe = pipeline("question-answering", model=model, tokenizer=tokenizer, torch_dtype=torch.bfloat16, device=device)

        latency_list = []
        for i in range(num_times):
            time_start = time.time()
            answer = qa_pipe(question=question, context=context)
            if i >= warmup_rounds:
                latency_list.append(time.time() - time_start)
        pipeline_inference_time = np.mean(latency_list)
    return pipeline_inference_time


@app.get("/benchmark")
async def benchmark(question: str, context: str):
    num_times = 50
    warmup_rounds = 20
    model_checkpoint = "roaltopo/scan-u-doc_question-answer"
    # Guard the XPU probe: torch.xpu is only available when IPEX (or an
    # XPU-enabled PyTorch build) is installed
    has_xpu = hasattr(torch, 'xpu') and torch.xpu.device_count() > 0
    score1 = get_score1(model_checkpoint, question, context, num_times, warmup_rounds, has_xpu)
    score2 = get_score2(model_checkpoint, question, context, num_times, warmup_rounds, has_xpu)
    return {'has_xpu': has_xpu, 'ipex_enabled': ipex_enabled, 'score1': score1, 'score2': score2}

############

app.mount("/", StaticFiles(directory="static", html=True), name="static")


@app.get("/")
def index() -> FileResponse:
    return FileResponse(path="/app/static/index.html", media_type="text/html")
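# ----------------------------------------------------------------------
# End-to-end sketch (illustrative only, not executed by this app): store
# a text under a UUID, then ask a question against it, again assuming a
# local server on port 8000. The UUID "demo-1" and the example strings
# are placeholders; allow_bool=True routes yes/no questions through the
# boolean-answer model.
#
#   import requests
#   base = "http://localhost:8000"
#   requests.post(f"{base}/store_text/demo-1",
#                 json={"text": "The Eiffel Tower is located in Paris."})
#   r = requests.post(f"{base}/answer_question/demo-1",
#                     json={"question": "Is the Eiffel Tower in Paris?",
#                           "allow_bool": True})
#   print(r.json())  # e.g. {'answer': 'YES'}
# ----------------------------------------------------------------------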