@@ -59,8 +59,14 @@ def get_documents_from_gcs(gcs_project_id, gcs_bucket_name, gcs_bucket_folder, g
5959
6060 if access_token is None :
6161 storage_client = storage .Client (project = gcs_project_id )
62- loader = GCSFileLoader (project_name = gcs_project_id , bucket = gcs_bucket_name , blob = blob_name , loader_func = load_document_content )
63- pages = loader .load ()
62+ bucket = storage_client .bucket (gcs_bucket_name )
63+ blob = bucket .blob (blob_name )
64+
65+ if blob .exists ():
66+ loader = GCSFileLoader (project_name = gcs_project_id , bucket = gcs_bucket_name , blob = blob_name , loader_func = load_document_content )
67+ pages = loader .load ()
68+ else :
69+ raise Exception ('File does not exist, Please re-upload the file and try again.' )
6470 else :
6571 creds = Credentials (access_token )
6672 storage_client = storage .Client (project = gcs_project_id , credentials = creds )
@@ -77,7 +83,7 @@ def get_documents_from_gcs(gcs_project_id, gcs_bucket_name, gcs_bucket_folder, g
7783 text += page .extract_text ()
7884 pages = [Document (page_content = text )]
7985 else :
80- raise Exception ('Blob Not Found' )
86+ raise Exception (f'File Not Found in GCS bucket - { gcs_bucket_name } ' )
8187 return gcs_blob_filename , pages
8288
8389def upload_file_to_gcs (file_chunk , chunk_number , original_file_name , bucket_name , folder_name_sha1_hashed ):
@@ -141,8 +147,9 @@ def copy_failed_file(source_bucket_name,dest_bucket_name,folder_name, file_name)
141147 storage_client = storage .Client ()
142148 bucket = storage_client .bucket (source_bucket_name )
143149 folder_file_name = folder_name + '/' + file_name
144- source_blob = bucket .blob (folder_file_name )
145- bucket .copy_blob (source_blob ,dest_bucket_name ,file_name )
146- logging .info (f'Failed file { file_name } copied to { dest_bucket_name } from { source_bucket_name } in GCS successfully' )
150+ source_blob = source_bucket .blob (folder_file_name )
151+ if source_blob .exists ():
152+ source_bucket .copy_blob (source_blob , dest_bucket , file_name )
153+ logging .info (f'Failed file { file_name } copied to { dest_bucket_name } from { source_bucket_name } in GCS successfully' )
147154 except Exception as e :
148155 raise Exception (e )
0 commit comments