Spaces:

fschwartzer
/

streamlit_chatbot

Running

fschwartzer committed on Sep 12, 2024

Commit

ef37c27

verified ·

1 Parent(s): 7413ee9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -29,14 +29,14 @@ def filter_dataframe(df, user_question, threshold=80):
     user_question = remove_stopwords(user_question)  # Remove stopwords
     question_words = user_question.split()
-    mask = pd.Series([False] * len(df))
     for column in df.columns:
         for word in question_words:
             # Apply RapidFuzz fuzzy matching on the column
             matches = process.extract(word, df[column], scorer=fuzz.token_sort_ratio, limit=None)
             match_indices = [match[2] for match in matches if match[1] >= threshold]
-            mask.iloc[match_indices] = True
     filtered_df = df[mask]

     user_question = remove_stopwords(user_question)  # Remove stopwords
     question_words = user_question.split()
+    mask = pd.Series([False] * len(df), index=df.index)
     for column in df.columns:
         for word in question_words:
             # Apply RapidFuzz fuzzy matching on the column
             matches = process.extract(word, df[column], scorer=fuzz.token_sort_ratio, limit=None)
             match_indices = [match[2] for match in matches if match[1] >= threshold]
+            mask.loc[match_indices] = True  # Ensure the mask is aligned with the DataFrame index
     filtered_df = df[mask]