Skip to content

Commit 58cf2b2

Browse files
author
Khanna
committed
fix: code clean up for data ingestion
1 parent 4210346 commit 58cf2b2

File tree

1 file changed

+0
-4
lines changed

1 file changed

+0
-4
lines changed

cdk/data_ingestion/src/processing/documents.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -104,14 +104,12 @@ def add_document(
     Returns:
         List[Document]: A list of all document chunks for this document that were added to the vectorstore.
     """
-    print("check embedding 99999")
     output_filenames = store_doc_texts(
         bucket=bucket,
         category_id=category_id,
         document_name=document_name,
         output_bucket=output_bucket
     )
-    print("check embedding 100")
     this_doc_chunks = store_doc_chunks(
         bucket=output_bucket,
         documentnames=output_filenames,
@@ -187,9 +185,7 @@ def process_documents(
     """
     print("start processing document")
     paginator = s3.get_paginator('list_objects_v2')
-    print("checking paginator 001")
     page_iterator = paginator.paginate(Bucket=bucket, Prefix=f"{category_id}/")
-    print("checking paginator 002")
     all_doc_chunks = []
 
     try:

0 commit comments

Comments
 (0)