| 
					
				 | 
			
			
				@@ -81,7 +81,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             except ProviderTokenNotInitError as e: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 dataset_document.error = str(e.description) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             except ObjectDeletedError: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 logging.warning('Document deleted, document id: {}'.format(dataset_document.id)) 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -89,7 +89,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 logging.exception("consume document failed") 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 dataset_document.error = str(e) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     def run_in_splitting_status(self, dataset_document: DatasetDocument): 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -140,13 +140,13 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         except ProviderTokenNotInitError as e: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.error = str(e.description) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-            dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         except Exception as e: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             logging.exception("consume document failed") 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.error = str(e) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-            dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     def run_in_indexing_status(self, dataset_document: DatasetDocument): 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -202,13 +202,13 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         except ProviderTokenNotInitError as e: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.error = str(e.description) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-            dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         except Exception as e: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             logging.exception("consume document failed") 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.indexing_status = 'error' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document.error = str(e) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-            dataset_document.stopped_at = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+            dataset_document.stopped_at = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             db.session.commit() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     def indexing_estimate(self, tenant_id: str, extract_settings: list[ExtractSetting], tmp_processing_rule: dict, 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -382,7 +382,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             after_indexing_status="splitting", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             extra_update_params={ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DatasetDocument.word_count: sum([len(text_doc.page_content) for text_doc in text_docs]), 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                DatasetDocument.parsing_completed_at: datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                DatasetDocument.parsing_completed_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         ) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -467,7 +467,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         doc_store.add_documents(documents) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         # update document status to indexing 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        cur_time = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        cur_time = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         self._update_document_index_status( 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             document_id=dataset_document.id, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             after_indexing_status="indexing", 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -482,7 +482,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document_id=dataset_document.id, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             update_params={ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DocumentSegment.status: "indexing", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                DocumentSegment.indexing_at: datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                DocumentSegment.indexing_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         ) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -685,7 +685,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             after_indexing_status="completed", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             extra_update_params={ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DatasetDocument.tokens: tokens, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                DatasetDocument.completed_at: datetime.datetime.utcnow(), 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                DatasetDocument.completed_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None), 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DatasetDocument.indexing_latency: indexing_end_at - indexing_start_at, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         ) 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -706,7 +706,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 ).update({ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                     DocumentSegment.status: "completed", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                     DocumentSegment.enabled: True, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                    DocumentSegment.completed_at: datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                    DocumentSegment.completed_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 }) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 db.session.commit() 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -739,7 +739,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             ).update({ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DocumentSegment.status: "completed", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DocumentSegment.enabled: True, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                DocumentSegment.completed_at: datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                DocumentSegment.completed_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             }) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             db.session.commit() 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -838,7 +838,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         doc_store.add_documents(documents) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         # update document status to indexing 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        cur_time = datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        cur_time = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         self._update_document_index_status( 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             document_id=dataset_document.id, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             after_indexing_status="indexing", 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -853,7 +853,7 @@ class IndexingRunner: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             dataset_document_id=dataset_document.id, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             update_params={ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 DocumentSegment.status: "indexing", 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                DocumentSegment.indexing_at: datetime.datetime.utcnow() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                DocumentSegment.indexing_at: datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             } 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         ) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         pass 
			 |