cdupland committed on
Commit
8a89e38
·
1 Parent(s): 68af04f

Add user-agent on WebBaseLoader

Browse files
Files changed (1) hide show
  1. RAG_PDF_WEB.py +3 -1
RAG_PDF_WEB.py CHANGED
@@ -13,7 +13,9 @@ from langchain_community.document_loaders import WebBaseLoader
13
  import os
14
 
15
  def get_docs_from_website(urls):
16
- loader = WebBaseLoader(urls)
 
 
17
  docs = loader.load()
18
  return docs
19
 
 
13
  import os
14
 
15
  def get_docs_from_website(urls):
16
+ loader = WebBaseLoader(urls, header_template={
17
+ 'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.0.0 Safari/537.36',
18
+ })
19
  docs = loader.load()
20
  return docs
21