SucheRAG

Sleeping

alexkueck committed on Jul 4, 2024

Commit

4421aa0

verified ·

1 Parent(s): cddacd5

Update utils.py

Files changed (1) hide show

utils.py CHANGED Viewed

@@ -424,26 +424,8 @@ def rag_chain(llm, prompt,  retriever):
 def query(api_llm, payload):
 	response = requests.post(api_llm, headers=HEADERS, json=payload)
 	return response.json()
-def extract_document_info(documents):
-    extracted_info = []
-    for doc in documents:
-        # Extract the filename from the path to use as the title
-        filename = os.path.basename(doc.metadata.get("path", ""))
-        title = filename if filename else "Keine Überschrift"
-        info = {
-            'content': doc.page_content,
-            'metadata': doc.metadata,
-            'titel': title,
-            'seite': doc.metadata.get("page", "Unbekannte Seite"),
-            'pfad': doc.metadata.get("path", "Kein Pfad verfügbar")
-        }
-        extracted_info.append(info)
-    return extracted_info
 def extract_document_info(documents):
@@ -456,9 +438,9 @@ def extract_document_info(documents):
         # Determine the document type and adjust the path accordingly
         doc_path = doc.metadata.get("path", "")
         if doc_path.endswith('.pdf'):
-            download_link = f"https://huggingface.co/spaces/alexkueck/SucheRAG/resolve/main/chroma/kkg/pdf/{title}?token=hf_token"
         elif doc_path.endswith('.docx'):
-            download_link = f"https://huggingface.co/spaces/alexkueck/SucheRAG/resolve/main/chroma/kkg/word/{title}?token=hf_token"
         else:
             download_link = doc_path

 def query(api_llm, payload):
 	response = requests.post(api_llm, headers=HEADERS, json=payload)
 	return response.json()
 def extract_document_info(documents):
         # Determine the document type and adjust the path accordingly
         doc_path = doc.metadata.get("path", "")
         if doc_path.endswith('.pdf'):
+            download_link = f"https://huggingface.co/spaces/alexkueck/SucheRAG/resolve/main/chroma/kkg/pdf/{title}"
         elif doc_path.endswith('.docx'):
+            download_link = f"https://huggingface.co/spaces/alexkueck/SucheRAG/resolve/main/chroma/kkg/word/{title}"
         else:
             download_link = doc_path