Update app.py
Browse files
app.py
CHANGED
@@ -41,16 +41,14 @@ def build_vectorstore_from_dataframe(df: pd.DataFrame):
|
|
41 |
df.fillna("", inplace=True)
|
42 |
df['combined_text'] = df.apply(lambda row: ' | '.join([str(cell) for cell in row]), axis=1)
|
43 |
|
44 |
-
|
45 |
-
|
46 |
-
page_content_column="text",
|
47 |
-
metadata_columns=["combined_text"]
|
48 |
-
)
|
49 |
documents = docs_loader.load()
|
50 |
|
51 |
for i, doc in enumerate(documents):
|
52 |
doc.metadata["source"] = f"Row {i+1}"
|
53 |
|
|
|
54 |
splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=150)
|
55 |
split_docs = splitter.split_documents(documents)
|
56 |
|
|
|
41 |
df.fillna("", inplace=True)
|
42 |
df['combined_text'] = df.apply(lambda row: ' | '.join([str(cell) for cell in row]), axis=1)
|
43 |
|
44 |
+
|
45 |
+
docs_loader = DataFrameLoader(df[['combined_text']], page_content_column='combined_text')
|
|
|
|
|
|
|
46 |
documents = docs_loader.load()
|
47 |
|
48 |
for i, doc in enumerate(documents):
|
49 |
doc.metadata["source"] = f"Row {i+1}"
|
50 |
|
51 |
+
|
52 |
splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=150)
|
53 |
split_docs = splitter.split_documents(documents)
|
54 |
|