@@ -49,7 +49,7 @@ def create_source_node_graph_url_s3(graph, model, source_url, aws_access_key_id,
49
49
for file_info in files_info :
50
50
file_name = file_info ['file_key' ]
51
51
obj_source_node = sourceNode ()
52
- obj_source_node .file_name = file_name .split ('/' )[- 1 ]
52
+ obj_source_node .file_name = file_name .split ('/' )[- 1 ]. strip () if isinstance ( file_name . split ( '/' )[ - 1 ], str ) else file_name . split ( '/' )[ - 1 ]
53
53
obj_source_node .file_type = 'pdf'
54
54
obj_source_node .file_size = file_info ['file_size_bytes' ]
55
55
obj_source_node .file_source = source_type
@@ -83,7 +83,7 @@ def create_source_node_graph_url_gcs(graph, model, gcs_project_id, gcs_bucket_na
83
83
lst_file_metadata = get_gcs_bucket_files_info (gcs_project_id , gcs_bucket_name , gcs_bucket_folder , credentials )
84
84
for file_metadata in lst_file_metadata :
85
85
obj_source_node = sourceNode ()
86
- obj_source_node .file_name = file_metadata ['fileName' ]
86
+ obj_source_node .file_name = file_metadata ['fileName' ]. strip () if isinstance ( file_metadata [ 'fileName' ], str ) else file_metadata [ 'fileName' ]
87
87
obj_source_node .file_size = file_metadata ['fileSize' ]
88
88
obj_source_node .url = file_metadata ['url' ]
89
89
obj_source_node .file_source = source_type
@@ -135,7 +135,7 @@ def create_source_node_graph_web_url(graph, model, source_url, source_type):
135
135
obj_source_node .model = model
136
136
obj_source_node .url = urllib .parse .unquote (source_url )
137
137
obj_source_node .created_at = datetime .now ()
138
- obj_source_node .file_name = title
138
+ obj_source_node .file_name = title . strip () if isinstance ( title , str ) else title
139
139
obj_source_node .language = language
140
140
obj_source_node .file_size = sys .getsizeof (pages [0 ].page_content )
141
141
obj_source_node .chunkNodeCount = 0
@@ -338,7 +338,7 @@ async def processing_source(uri, userName, password, database, model, file_name,
338
338
if result [0 ]['Status' ] != 'Processing' :
339
339
obj_source_node = sourceNode ()
340
340
status = "Processing"
341
- obj_source_node .file_name = file_name
341
+ obj_source_node .file_name = file_name . strip () if isinstance ( file_name , str ) else file_name
342
342
obj_source_node .status = status
343
343
obj_source_node .total_chunks = total_chunks
344
344
obj_source_node .model = model
@@ -412,7 +412,7 @@ async def processing_source(uri, userName, password, database, model, file_name,
412
412
end_time = datetime .now ()
413
413
processed_time = end_time - start_time
414
414
obj_source_node = sourceNode ()
415
- obj_source_node .file_name = file_name
415
+ obj_source_node .file_name = file_name . strip () if isinstance ( file_name , str ) else file_name
416
416
obj_source_node .status = job_status
417
417
obj_source_node .processing_time = processed_time
418
418
@@ -650,7 +650,7 @@ def upload_file(graph, model, chunk, chunk_number:int, total_chunks:int, origina
650
650
logging .info ("File merged successfully" )
651
651
file_extension = originalname .split ('.' )[- 1 ]
652
652
obj_source_node = sourceNode ()
653
- obj_source_node .file_name = originalname
653
+ obj_source_node .file_name = originalname . strip () if isinstance ( originalname , str ) else originalname
654
654
obj_source_node .file_type = file_extension
655
655
obj_source_node .file_size = file_size
656
656
obj_source_node .file_source = 'local file'
@@ -693,7 +693,7 @@ def manually_cancelled_job(graph, filenames, source_types, merged_dir, uri):
693
693
694
694
for (file_name ,source_type ) in zip (filename_list , source_types_list ):
695
695
obj_source_node = sourceNode ()
696
- obj_source_node .file_name = file_name
696
+ obj_source_node .file_name = file_name . strip () if isinstance ( file_name , str ) else file_name
697
697
obj_source_node .is_cancelled = True
698
698
obj_source_node .status = 'Cancelled'
699
699
obj_source_node .updated_at = datetime .now ()
@@ -728,7 +728,7 @@ def set_status_retry(graph, file_name, retry_condition):
728
728
graphDb_data_Access = graphDBdataAccess (graph )
729
729
obj_source_node = sourceNode ()
730
730
status = "Ready to Reprocess"
731
- obj_source_node .file_name = file_name
731
+ obj_source_node .file_name = file_name . strip () if isinstance ( file_name , str ) else file_name
732
732
obj_source_node .status = status
733
733
obj_source_node .retry_condition = retry_condition
734
734
obj_source_node .is_cancelled = False
0 commit comments