Skip to content

Commit ea5672b

Browse files
committed
Generate a GraphModuleWrapper class to support re-extraction from a GraphNet sample while retaining the parameter information.
1 parent 2da5267 commit ea5672b

File tree

2 files changed

+92
-18
lines changed

2 files changed

+92
-18
lines changed

graph_net/paddle/extractor.py

Lines changed: 83 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1,16 +1,61 @@
11
import os
22
import json
3-
4-
os.environ["ENABLE_CINN_IN_DY2ST"] = "0"
5-
# os.environ["FLAGS_logging_trunc_pir_py_code"] = "1"
6-
# os.environ["FLAGS_logging_pir_py_code_int_tensor_element_limit"] = "64"
7-
os.environ["FLAGS_logging_pir_py_code_dir"] = "/tmp/dump"
3+
import importlib.util
84

95
import paddle
106
from athena.module_op_unittests_for_graphnet import GraphnetSample, generate_samples
117
from graph_net.paddle import utils
128

139

10+
def load_class_from_file(file_path: str, class_name: str):
    """Import *file_path* as an anonymous module and look up *class_name* in it.

    Returns:
        The class object bound to *class_name*, or ``None`` when the module
        defines no attribute with that name.
    """
    print(f"Load {class_name} from {file_path}")
    module_spec = importlib.util.spec_from_file_location("unnamed", file_path)
    loaded_module = importlib.util.module_from_spec(module_spec)
    module_spec.loader.exec_module(loaded_module)
    return getattr(loaded_module, class_name, None)
17+
18+
19+
def write_to_file(filepath, content):
    """Write *content* to *filepath*, logging the destination first.

    Args:
        filepath: Target path; the file is created or truncated.
        content: Text to write.
    """
    print(f"Write to {filepath}")
    # Explicit encoding: the content is generated Python source, so it must be
    # UTF-8 regardless of the platform's default locale encoding.
    with open(filepath, "w", encoding="utf-8") as f:
        f.write(content)
23+
24+
25+
def generate_model_wrapper_class(model_dump_path, data_arg_names):
    """Generate, persist, and load a ``GraphModuleWrapper`` layer class.

    The generated class wraps a graph module so that parameters registered
    via ``set_parameters`` are re-collected in ``forward`` and forwarded to
    the wrapped module alongside the named data arguments.

    Args:
        model_dump_path: Directory in which ``graph_module_wrapper.py`` is written.
        data_arg_names: Iterable of argument names for the generated ``forward``.

    Returns:
        The freshly loaded ``GraphModuleWrapper`` class object.
    """
    template = """
import paddle

class GraphModuleWrapper(paddle.nn.Layer):
    def __init__(self, graph_module):
        super().__init__()
        self.graph_module = graph_module

    def set_parameters(self, **kwargs):
        for name, value in kwargs.items():
            if isinstance(value, paddle.nn.parameter.Parameter):
                setattr(self, name, value)

    def forward(self, ${DATA_ARG_NAMES}):
        param_dict = { name: param for name, param in self.named_parameters() }
        outputs = self.graph_module(${DATA_ARG_VALUE_PAIRS}, **param_dict)
        return outputs
"""

    names_csv = ", ".join(data_arg_names)
    pairs_csv = ", ".join(f"{name}={name}" for name in data_arg_names)
    code_str = template.replace("${DATA_ARG_NAMES}", names_csv).replace(
        "${DATA_ARG_VALUE_PAIRS}", pairs_csv
    )
    print(code_str)

    file_path = os.path.join(model_dump_path, "graph_module_wrapper.py")
    write_to_file(file_path, code_str)
    return load_class_from_file(file_path=file_path, class_name="GraphModuleWrapper")
58+
1459
# used as configuration of python -m graph_net.paddle.run_model
1560
class RunModelDecorator:
1661
def __init__(self, config):
@@ -89,18 +134,47 @@ def run_model_with_dump_enabled(self, model_dump_path, **input_dict):
89134
# Get model dump path
90135
old_flags = self.prepare_to_extract(model_dump_path)
91136

137+
param_dict = {
138+
k: v
139+
for k, v in input_dict.items()
140+
if isinstance(v, paddle.nn.parameter.Parameter)
141+
}
142+
data_dict = {
143+
k: v
144+
for k, v in input_dict.items()
145+
if not isinstance(v, paddle.nn.parameter.Parameter)
146+
}
147+
148+
input_spec = self.input_spec
92149
if self.input_spec is None:
93-
self.input_spec = [
150+
input_spec = [
94151
paddle.static.InputSpec(value.shape, value.dtype, name=name)
95-
for name, value in input_dict.items()
152+
for name, value in data_dict.items()
96153
if isinstance(value, paddle.Tensor)
97154
]
155+
else:
156+
assert len(input_spec) == len(data_dict)
157+
158+
if param_dict:
159+
model_wrapper_class = generate_model_wrapper_class(
160+
model_dump_path, data_dict.keys()
161+
)
162+
wrapped_model = model_wrapper_class(self.model)
163+
wrapped_model.set_parameters(**param_dict)
164+
else:
165+
wrapped_model = self.model
98166

99167
# Run the static model
100168
static_model = paddle.jit.to_static(
101-
self.model, input_spec=self.input_spec, full_graph=True
169+
wrapped_model,
170+
input_spec=input_spec,
171+
full_graph=True,
172+
backend=None,
102173
)
103-
static_model(**input_dict)
174+
static_model.eval()
175+
program = static_model.forward.concrete_program.main_program
176+
# print(program)
177+
static_model(**data_dict)
104178

105179
# Restore the environment
106180
paddle.set_flags(old_flags)
@@ -147,11 +221,6 @@ def translate_pir_program_to_sample_codes(
147221
return self.subgraph_idx2samples
148222

149223
def write_sample_to_file(self, subgraph_path, sample):
150-
def write_to_file(filepath, content):
151-
print(f"Write to {filepath}")
152-
with open(filepath, "w") as f:
153-
f.write(content)
154-
155224
if not os.path.exists(subgraph_path):
156225
os.makedirs(subgraph_path, exist_ok=True)
157226
write_to_file(f"{subgraph_path}/model.py", sample.model)

graph_net/paddle/run_model.py

Lines changed: 9 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,13 @@
1+
import os
12
import sys
23
import json
34
import base64
45
import argparse
56
import importlib.util
67
from typing import Type
78

9+
os.environ["FLAGS_logging_pir_py_code_dir"] = "/tmp/dump"
10+
811
import paddle
912
from graph_net.paddle import utils
1013

@@ -23,8 +26,11 @@ def get_input_dict(model_path):
2326
params = inputs_params["weight_info"]
2427
inputs = inputs_params["input_info"]
2528

26-
params.update(inputs)
27-
state_dict = {k: utils.replay_tensor(v) for k, v in params.items()}
29+
state_dict = {}
30+
for k, v in params.items():
31+
state_dict[k] = paddle.nn.parameter.Parameter(utils.replay_tensor(v), name=k)
32+
for k, v in inputs.items():
33+
state_dict[k] = utils.replay_tensor(v)
2834
return state_dict
2935

3036

@@ -58,9 +64,8 @@ def main(args):
5864
model = model_class()
5965
print(f"{model_path=}")
6066

61-
model = _get_decorator(args)(model)
6267
input_dict = get_input_dict(args.model_path)
63-
68+
model = _get_decorator(args)(model)
6469
model(**input_dict)
6570

6671

0 commit comments

Comments
 (0)