Ritvik19 committed on
Commit
b0a4a7b
1 Parent(s): b517eef

Update process_documents.py

Browse files
Files changed (1) hide show
  1. process_documents.py +1 -1
process_documents.py CHANGED
@@ -37,7 +37,7 @@ def process_web(url, source_id):
37
  data = WebBaseLoader(f"https://r.jina.ai/{url}").load()[0]
38
  document_snippets = [
39
  Document(
40
- page_content=deep_strip(data.page_content),
41
  metadata={
42
  "header": data.metadata["title"],
43
  "source_url": url,
 
37
  data = WebBaseLoader(f"https://r.jina.ai/{url}").load()[0]
38
  document_snippets = [
39
  Document(
40
+ page_content=data.page_content,
41
  metadata={
42
  "header": data.metadata["title"],
43
  "source_url": url,