add metadata (file_name)
This commit is contained in:
+23
-6
@@ -1,4 +1,5 @@
|
||||
from chromadb import QueryResult
|
||||
from collections.abc import Mapping
|
||||
|
||||
from chroma_functions import add_data, query_data
|
||||
from chunk_functions import chunk_file
|
||||
@@ -13,7 +14,7 @@ def print_lines(lines: list[str]) -> None:
|
||||
def ingest_file(collection_name: str, file_path: str) -> int:
|
||||
chunks = chunk_file(file_path)
|
||||
embeddings = embed(chunks)
|
||||
add_data(collection_name, embeddings)
|
||||
add_data(collection_name, embeddings, file_path)
|
||||
return len(embeddings)
|
||||
|
||||
|
||||
@@ -25,22 +26,38 @@ def format_query_result(result: QueryResult) -> list[str]:
|
||||
ids = result.get("ids", [[]])
|
||||
documents = result.get("documents", [[]])
|
||||
distances = result.get("distances", [[]])
|
||||
metadatas = result.get("metadatas", [[]])
|
||||
|
||||
first_ids = ids[0] if ids else []
|
||||
first_documents = documents[0] if documents else []
|
||||
first_distances = distances[0] if distances else []
|
||||
first_metadatas = metadatas[0] if metadatas else []
|
||||
|
||||
if not first_ids:
|
||||
return ["No results found."]
|
||||
|
||||
lines = ["Query results:"]
|
||||
|
||||
for index, document_id in enumerate(first_ids, start=1):
|
||||
lines.append(f"{index}. id: {document_id}")
|
||||
lines.append(f"{index}.\tid: {document_id}")
|
||||
i = index - 1
|
||||
|
||||
if index - 1 < len(first_distances):
|
||||
lines.append(f" distance: {first_distances[index - 1]}")
|
||||
if i < len(first_distances):
|
||||
lines.append(f"\tdistance: {first_distances[i]}")
|
||||
|
||||
if index - 1 < len(first_documents):
|
||||
lines.append(f" document: {first_documents[index - 1]}")
|
||||
if i < len(first_metadatas):
|
||||
metadata = first_metadatas[i]
|
||||
|
||||
if isinstance(metadata, Mapping):
|
||||
file_name = metadata.get("file_name")
|
||||
|
||||
if file_name:
|
||||
lines.append(f"\tfile_name: {file_name}")
|
||||
|
||||
if i < len(first_documents):
|
||||
lines.append(f"\tdocument: {first_documents[i]}")
|
||||
|
||||
# Print a separator between documents
|
||||
lines.append(60 * "-")
|
||||
|
||||
return lines
|
||||
|
||||
Reference in New Issue
Block a user