Skip to content

Commit

Permalink
fix: skip empty string passages returned by llama index parsing (#1208)
Browse files (browse the repository at this point in the history)
  • Loading branch information
sarahwooders authored Apr 2, 2024
1 parent 353a5bf commit 114969e
Showing 1 changed file with 10 additions and 0 deletions.
10 changes: 10 additions & 0 deletions memgpt/data_sources/connectors.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -55,6 +55,16 @@ def load_data(

# generate passages
for passage_text, passage_metadata in connector.generate_passages([document], chunk_size=embedding_config.embedding_chunk_size):

# for some reason, llama index parsers sometimes return empty strings
if len(passage_text) == 0:
typer.secho(
f"Warning: Llama index parser returned empty string, skipping insert of passage with metadata '{passage_metadata}' into VectorDB. You can usually ignore this warning.",
fg=typer.colors.YELLOW,
)
continue

# get embedding
try:
embedding = embed_model.get_text_embedding(passage_text)
except Exception as e:
Expand Down

0 comments on commit 114969e

Please sign in to comment.