1919
2020
class BaseDataSourceWebNodeForm(BaseForm):
    """Input form for the web data-source node.

    Declares two text inputs: the required source URL and an optional
    selector. Both carry a translated placeholder hint.
    """

    # Required text input; the placeholder asks for the Web root address.
    source_url = forms.TextInputField(
        _('Web source url'),
        required=True,
        attrs={'placeholder': _('Please enter the Web root address')},
    )
    # Optional text input; the placeholder states that the default is body.
    selector = forms.TextInputField(
        _('Web knowledge selector'),
        required=False,
        attrs={'placeholder': _('The default is body, you can enter .classname/#idname/tagname')},
    )
2426
2527
2628def get_collect_handler ():
@@ -38,7 +40,7 @@ def handler(child_link: ChildLink, response: Fork.Response):
3840 except Exception as e :
3941 maxkb_logger .error (f'{ str (e )} :{ traceback .format_exc ()} ' )
4042
41- return handler ,results
43+ return handler , results
4244
4345
4446class BaseDataSourceWebNode (IDataSourceWebNode ):
@@ -61,24 +63,22 @@ def execute(self, **kwargs) -> NodeResult:
6163 collect_handler , document_list = get_collect_handler ()
6264
6365 try :
64- ForkManage (source_url ,selector .split (" " ) if selector is not None else []).fork (3 ,set (),collect_handler )
66+ ForkManage (source_url , selector .split (" " ) if selector is not None else []).fork (3 , set (), collect_handler )
6567
66- return NodeResult ({'document_list' : document_list },
67- self .workflow_manage .params .get ('knowledge_base' ) or {})
68+ return NodeResult ({'document_list' : document_list },
69+ self .workflow_manage .params .get ('knowledge_base' ) or {})
6870
6971 except Exception as e :
# The message template names its placeholder {node_id}, so the keyword given
# to format() must be node_id too. The previous knowledge_id= keyword left
# {node_id} unfilled, making format() raise KeyError while reporting the
# original failure. The template text itself is left unchanged.
# NOTE(review): nothing visible follows this call in the handler, so the
# method appears to return None on failure - confirm callers expect that.
maxkb_logger.error(_('data source web node:{node_id} error{error}{traceback}').format(
    node_id=node_id, error=str(e), traceback=traceback.format_exc()))
7274
73-
74-
7575 def get_details (self , index : int , ** kwargs ):
7676 return {
7777 'name' : self .node .properties .get ('stepName' ),
7878 "index" : index ,
7979 'run_time' : self .context .get ('run_time' ),
8080 'type' : self .node .type ,
81- 'input_params' : {"source_url" : self .context .get ("source_url" ),"selector" : self .context .get ('selector' )},
81+ 'input_params' : {"source_url" : self .context .get ("source_url" ), "selector" : self .context .get ('selector' )},
8282 'output_params' : self .context .get ('document_list' ),
8383 'knowledge_base' : self .workflow_params .get ('knowledge_base' ),
8484 'status' : self .status ,
0 commit comments