Spaces:

Pranjalg22
/

Contextual_ChatBot

Sleeping

Pranjal Gupta committed on Sep 7

Commit

d272c6c

1 Parent(s): 157b2e3

meta chunks error fixed

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,7 +45,24 @@ def process_pdf(file_path):
     # Ingest into the vector store
     # Note: A docId is added to group these documents
-    vectorDB.add_documents(texts, metadatas=[{"docId": "uploaded_doc"}] * len(texts))
     gr.Info("PDF processed and ready for questions!")
 # Your existing functions

     # Ingest into the vector store
     # Note: A docId is added to group these documents
+    metadata_chunks = []
+    # Rebuild every chunk as its own Document with explicit metadata and an id
+    for i, chunk in enumerate(texts):
+        # Add metadata to each chunk
+        metadata = {"source": f"example_source_{i}", "docId":str("42")}
+        id = str(i)
+        doc_with_metadata = Document(
+            page_content=chunk.page_content, metadata=metadata, id=id,docId="42"
+        )
+        metadata_chunks.append(doc_with_metadata)
+    print("Done")
+    # Add the documents to the vector database
+    try:
+        vectorDB.add_documents(metadata_chunks)
+    except:
+        raise Exception()
     gr.Info("PDF processed and ready for questions!")
 # Your existing functions