Sarath0x8f committed on
Commit 3e21c23 · verified · 1 Parent(s): bed27c6

Update app.py

Files changed (1):
  1. app.py +69 -30
app.py CHANGED
@@ -10,16 +10,34 @@ import gradio as gr
 # Load environment variables
 load_dotenv()
 
-# Initialize the LLM and parser
-llm = HuggingFaceInferenceAPI(
-    # model_name="meta-llama/Meta-Llama-3-8B-Instruct",
-    model_name="mistralai/Mixtral-8x7B-Instruct-v0.1",
-    # model_name="nvidia/Llama3-ChatQA-1.5-70B", ## 144GB > 10GB
-    # model_name= "Nexusflow/NexusRaven-V2-13B", ## 26 GB
-    token=os.getenv("TOKEN"),
-    # model_config['protected_namespaces'] = ()
-)
+models = [
+    "mistralai/Mixtral-8x7B-Instruct-v0.1",
+    "meta-llama/Meta-Llama-3-8B-Instruct",
+    # "NousResearch/Yarn-Mistral-7b-64k", ## 14GB>10GB
+    # "impira/layoutlm-document-qa", ## ERR
+    # "Qwen/Qwen1.5-7B", ## 15GB
+    # "Qwen/Qwen2.5-3B", ## high response time
+    # "google/gemma-2-2b-jpn-it", ## high response time
+    # "impira/layoutlm-invoices", ## bad req
+    # "google/pix2struct-docvqa-large", ## bad req
+    "mistralai/Mistral-7B-Instruct-v0.2",
+    # "google/gemma-7b-it", ## 17GB > 10GB
+    # "google/gemma-2b-it", ## high response time
+    # "HuggingFaceH4/zephyr-7b-beta", ## high response time
+    # "HuggingFaceH4/zephyr-7b-gemma-v0.1", ## bad req
+    # "microsoft/phi-2", ## high response time
+    # "TinyLlama/TinyLlama-1.1B-Chat-v1.0", ## high response time
+    # "mosaicml/mpt-7b-instruct", ## 13GB>10GB
+    "tiiuae/falcon-7b-instruct",
+    "google/flan-t5-xxl"
+    # "NousResearch/Yarn-Mistral-7b-128k", ## 14GB>10GB
+    # "Qwen/Qwen2.5-7B-Instruct", ## 15GB>10GB
+]
 
+# Global variable for selected model
+selected_model_name = models[0]  # Default to the first model in the list
+
+# Initialize the parser
 parser = LlamaParse(api_key=os.getenv("LLAMA_INDEX_API"), result_type='markdown')
 file_extractor = {'.pdf': parser, '.docx': parser, '.doc': parser}
 
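This hunk swaps the single hardcoded HuggingFaceInferenceAPI instance for a models list plus a module-level selected_model_name default; the commented-out entries record models that were tried and set aside (too large for the 10GB limit, bad requests, or slow responses). Since both the HF token and the LlamaParse key are read from the environment, a startup check along these lines (a hypothetical helper, not part of the commit) could fail fast before the UI comes up:

# Hypothetical startup check, not part of the commit: verify the secrets
# that app.py reads via os.getenv() before the Gradio UI launches.
import os

for var in ("TOKEN", "LLAMA_INDEX_API"):
    if not os.getenv(var):
        raise RuntimeError(f"Missing required environment variable: {var}")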
@@ -29,32 +47,51 @@ embed_model = HuggingFaceEmbedding(model_name="BAAI/bge-small-en-v1.5")
 # Global variable to store documents loaded from user-uploaded files
 vector_index = None
 
+
 # File processing function
 def load_files(file_path: str):
     try:
         global vector_index
         document = SimpleDirectoryReader(input_files=[file_path], file_extractor=file_extractor).load_data()
         vector_index = VectorStoreIndex.from_documents(document, embed_model=embed_model)
-        print(f"parsing done {file_path}")
+        print(f"Parsing done for {file_path}")
         filename = os.path.basename(file_path)
-        return f"Ready to give response on give {filename}"
+        return f"Ready to give response on {filename}"
     except Exception as e:
-        return f"An error occurred {e}"
+        return f"An error occurred: {e}"
+
 
+# Function to handle the selected model from dropdown
+def set_model(selected_model):
+    global selected_model_name
+    selected_model_name = selected_model  # Update the global variable
+    # print(f"Model selected: {selected_model_name}")
+    # return f"Model set to: {selected_model_name}"
+
+
+# Respond function that uses the globally set selected model
 def respond(message, history):
     try:
+        # Initialize the LLM with the selected model
+        llm = HuggingFaceInferenceAPI(
+            model_name=selected_model_name,
+            token=os.getenv("TOKEN")
+        )
+
+        # Check selected model
+        # print(f"Using model: {selected_model_name}")
+
+        # Set up the query engine with the selected LLM
         query_engine = vector_index.as_query_engine(llm=llm)
         bot_message = query_engine.query(message)
-        # output = ""
-        # for chr in bot_message:
-        #     output += chr
-        #     yield output
-        print(f"\n{datetime.now()}:: {message} --> {str(bot_message)}\n")
-        return str(bot_message)
+
+        print(f"\n{datetime.now()}:{selected_model_name}:: {message} --> {str(bot_message)}\n")
+        return f"{selected_model_name}:\n{str(bot_message)}"
     except Exception as e:
-        if e == "'NoneType' object has no attribute 'as_query_engine'":
-            return "upload file"
-        return f"an error occurred {e}"
+        if str(e) == "'NoneType' object has no attribute 'as_query_engine'":
+            return "Please upload a file."
+        return f"An error occurred: {e}"
+
 
 # UI Setup
 with gr.Blocks() as demo:
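The key behavioral change in this hunk is that respond() now builds the HuggingFaceInferenceAPI client on every call from the global selected_model_name, so a dropdown change takes effect on the very next message without restarting the Space. The cost is a fresh client per question; one possible refinement (a sketch only, not in the commit, and the import path may differ across llama-index versions) is to memoize one client per model name:

# Sketch: cache one inference client per model so repeated questions against
# the same model reuse the client. Import path is an assumption; match it to
# whatever app.py already imports.
import os
from functools import lru_cache

from llama_index.llms.huggingface import HuggingFaceInferenceAPI

@lru_cache(maxsize=None)
def get_llm(model_name: str) -> HuggingFaceInferenceAPI:
    return HuggingFaceInferenceAPI(model_name=model_name, token=os.getenv("TOKEN"))

# respond() would then call:
# query_engine = vector_index.as_query_engine(llm=get_llm(selected_model_name))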
@@ -65,18 +102,20 @@ with gr.Blocks() as demo:
         clear = gr.ClearButton()
         btn = gr.Button("Submit", variant='primary')
         output = gr.Text(label='Vector Index')
+        model_dropdown = gr.Dropdown(models, label="Select Model", interactive=True)
+
     with gr.Column(scale=3):
-        gr.ChatInterface(fn=respond,
-                         chatbot=gr.Chatbot(height=500),
-                         textbox=gr.Textbox(placeholder="Ask me questions on given document!", container=False, scale=7),
-                         # examples=["summarize the document"]
-                         )
+        gr.ChatInterface(
+            fn=respond,
+            chatbot=gr.Chatbot(height=500),
+            textbox=gr.Textbox(placeholder="Ask me questions on the uploaded document!", container=False, scale=7)
+        )
 
-    # Action on button click to process file and load into index
+    # Set up Gradio interactions
+    model_dropdown.change(fn=set_model, inputs=model_dropdown)
     btn.click(fn=load_files, inputs=file_input, outputs=output)
-    clear.click(lambda: [None]*2, outputs=[file_input, output])
-
+    clear.click(lambda: [None] * 2, outputs=[file_input, output])
 
-# Launch the demo with public link option
+# Launch the demo with a public link option
 if __name__ == "__main__":
     demo.launch()
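With the UI wiring in place, model_dropdown.change feeds set_model (which returns nothing, so no outputs argument is passed), btn.click runs load_files, and the clear button resets the file input and status text. The non-UI plumbing can be exercised without Gradio; a hypothetical smoke test, assuming app.py's names are importable and "sample.pdf" exists:

# Hypothetical smoke test, not part of the commit; "sample.pdf" is illustrative.
from app import set_model, load_files, respond

set_model("mistralai/Mistral-7B-Instruct-v0.2")       # switch the global model
print(load_files("sample.pdf"))                       # expect "Ready to give response on sample.pdf"
print(respond("Summarize the document", history=[]))  # answer prefixed with the model name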
 