PaddlePaddle
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
Lines changed: 1 addition & 1 deletion
diff --git a/graph_net/analysis_util.py b/graph_net/analysis_util.py
Lines changed: 28 additions & 23 deletions
diff --git a/graph_net/config/decomposition_error_tmp_torch_samples_list.txt b/graph_net/config/decomposition_error_tmp_torch_samples_list.txt
Lines changed: 1 addition & 0 deletions
@@ -9,7 +9,7 @@ repos:
   rev: v0.14.4
   hooks:
     - id: ruff-check
-      args: [--fix, --exit-non-zero-on-fix, --no-cache]
+      args: [--fix, --exit-non-zero-on-fix, --no-cache, --exclude=samples]
 
 - repo: https://github.com/Lucas-C/pre-commit-hooks.git
   rev: v1.5.1
 
@@ -35,14 +35,19 @@ def detect_sample_status(log_text: str) -> str:
 
     # Scan for status and mismatch markers
     for line in lines:
-        if "[Result][status] eager:success" in line:
+        if "[Datatype][eager]" in line:
             eager_success = True
         elif "[Datatype][compiled]" in line:
             compile_success = True
+        elif "[Shape]" in line and "match:True" in line:
+            shape_match = True
         elif "[DataType]" in line and "match:True" in line:
             type_match = True
         elif "all_close" in line:
+            # If an all_close check result is present, both the eager and compiled runs must have succeeded.
             shape_match = True
+            eager_success = True
+            compile_success = True
         else:
             # Do nothing
             pass
@@ -82,6 +87,7 @@ def parse_single_sample_log_to_data(log_text: str) -> dict:
         lines = log_text
 
     data = {
+        "model_path": None,
         "configuration": {},
         "correctness": {},
         "performance": {
@@ -95,6 +101,7 @@ def parse_single_sample_log_to_data(log_text: str) -> dict:
 
     # Define regex patterns for each type of log line
     patterns = {
+        "processing": re.compile(r"\[Processing\] (.+)"),
         "config": re.compile(r"\[Config\] (\S+): (.+)"),
         "performance": re.compile(r"\[Performance\]\[(\w+)\]: (.+)"),
         "datatype": re.compile(r"\[Datatype\]\[(\w+)\]: (.+)"),
@@ -103,6 +110,11 @@ def parse_single_sample_log_to_data(log_text: str) -> dict:
     }
 
     for line in lines:
+        processing_match = patterns["processing"].search(line)
+        if processing_match:
+            data["model_path"] = line.split()[-1]
+            continue
+
         config_match = patterns["config"].search(line)
         if config_match:
             key, value = config_match.groups()
@@ -167,32 +179,25 @@ def parse_logs_to_data(log_file: str) -> list:
         print(f"No content in {log_file}")
         return []
 
-    model_path = None
-    samples, current_lines, processing_lines = [], [], []
-
-    def process_a_sample(model_path):
+    def process_a_sample(current_lines, samples):
         data = parse_single_sample_log_to_data(current_lines)
-        if data.get("model_path", None) is None and model_path:
-            data["model_path"] = model_path
         samples.append(data)
 
+    samples, current_lines = [], []
     for line in lines:
         if "[Processing]" in line:
-            model_path = line.split()[-1]
-        else:
             if current_lines:
-                current_lines.append(line)
-            continue
-
-        if current_lines:
-            process_a_sample(model_path)
-
-        processing_lines.append(line)
-        current_lines = [line]
+                # parse the logs of the previous sample
+                process_a_sample(current_lines, samples)
+            # reset current_lines so the new sample starts with its [Processing] line
+            current_lines = [line]
+        else:
+            # append line of current sample
+            current_lines.append(line) if current_lines else None
 
-    # Process final sample
     if current_lines:
-        process_a_sample(model_path)
+        # parse the final sample
+        process_a_sample(current_lines, samples)
 
     print(f"Parsed {len(samples)} samples from {log_file}")
     return samples
@@ -472,11 +477,11 @@ def get_incorrect_models(
                     sample.get("model_path")
                 ) if current_correctness != "correct" else None
             else:
-                iscorrect, err = check_sample_correctness(sample, tolerance)
-                failed_models.add(sample.get("model_path")) if not iscorrect else None
+                is_correct, fail_type = check_sample_correctness(sample, tolerance)
+                failed_models.add(sample.get("model_path")) if not is_correct else None
     else:
         for idx, sample in enumerate(samples):
-            iscorrect, err = check_sample_correctness(sample, tolerance)
-            failed_models.add(sample.get("model_path")) if not iscorrect else None
+            is_correct, fail_type = check_sample_correctness(sample, tolerance)
+            failed_models.add(sample.get("model_path")) if not is_correct else None
 
     return failed_models
@@ -0,0 +1 @@
+samples/transformers-auto-model/dbmdz_electra-large-discriminator-finetuned-conll03-english
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+samples/transformers-auto-model/dbmdz_electra-large-discriminator-finetuned-conll03-english`