Skip to content

Commit 0406a8b

Browse files
committed
[llvm-advisor] Add static analysis and profiling tool parsers
- Implement static analyzer parser for code quality analysis
- Add SARIF parser for the standardized analysis result format
- Add objdump parser for object file inspection
- Add PGO profile parser for profile-guided optimization data
- Add XRay parser for runtime tracing and profiling
- Add version info parser for toolchain metadata
1 parent a79cb5a commit 0406a8b

File tree

7 files changed

+490
-1
lines changed

7 files changed

+490
-1
lines changed
Lines changed: 118 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,118 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
import re
10+
from typing import Dict, List, Any
11+
from .base_parser import BaseParser
12+
from ..models import FileType, ParsedFile, Symbol
13+
14+
15+
class ObjdumpParser(BaseParser):
    """Parse textual (llvm-)objdump output into structured data.

    Extracts symbol-table entries, disassembly rows, and header markers
    from a captured objdump dump and summarizes the counts.
    """

    def __init__(self):
        super().__init__(FileType.OBJDUMP)
        # Symbol-table rows: <addr> <scope l/g/w/!> <type d/D/f/F/o/O> <section> <size> <name>
        self.symbol_pattern = re.compile(
            r"^([0-9a-fA-F]+)\s+([lgw!])\s+([dDfFoO])\s+(\S+)\s+([0-9a-fA-F]+)\s+(.+)"
        )
        # Header row of the section table ("Idx Name Size VMA ...").
        # NOTE(review): this pattern is never applied in _parse_objdump_content,
        # so the "sections" list always stays empty — confirm whether section
        # parsing was intended.
        self.section_pattern = re.compile(
            r"^Idx\s+Name\s+Size\s+VMA\s+LMA\s+File Offset\s+Algn"
        )
        # Disassembly rows: "<addr>: <hex bytes>  <instruction>"
        self.disasm_pattern = re.compile(
            r"^\s*([0-9a-fA-F]+):\s+([0-9a-fA-F\s]+)\s+(.+)"
        )

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile with the extracted data.

        On unreadable/oversized files or any parse error, returns a
        ParsedFile whose metadata carries an "error" entry instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, {}, {"error": "File too large or unreadable"}
            )

        try:
            lines = content.split("\n")
            objdump_data = self._parse_objdump_content(lines)

            metadata = {
                "file_size": self.get_file_size(file_path),
                "total_lines": len(lines),
                **objdump_data["summary"],
            }

            return self.create_parsed_file(file_path, objdump_data, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, {}, {"error": str(e)})

    def _parse_objdump_content(self, lines: List[str]) -> Dict[str, Any]:
        """Walk the dump line by line, classifying each line as a symbol,
        a disassembly row, or a header marker, depending on the current mode."""
        objdump_data = {
            "symbols": [],
            "sections": [],
            "disassembly": [],
            "headers": [],
            "summary": {},
        }

        in_symbol_table = False
        in_disassembly = False

        for line in lines:
            line = line.rstrip()

            if not line:
                continue

            # Mode switches: these markers introduce the lines that follow.
            if "SYMBOL TABLE:" in line:
                in_symbol_table = True
                continue
            elif "Disassembly of section" in line:
                in_disassembly = True
                continue
            elif line.startswith("Contents of section"):
                # Raw section-contents dumps are skipped (not parsed).
                continue

            # Match each pattern at most once per line (the original matched
            # every pattern twice: once in the condition, once to bind).
            symbol_match = (
                self.symbol_pattern.match(line) if in_symbol_table else None
            )
            disasm_match = (
                self.disasm_pattern.match(line) if in_disassembly else None
            )

            if symbol_match:
                objdump_data["symbols"].append(
                    Symbol(
                        name=symbol_match.group(6),
                        address=symbol_match.group(1),
                        type=symbol_match.group(3),
                        section=symbol_match.group(4),
                    )
                )
            elif disasm_match:
                objdump_data["disassembly"].append(
                    {
                        "address": disasm_match.group(1),
                        "bytes": disasm_match.group(2).strip(),
                        "instruction": disasm_match.group(3),
                    }
                )
            elif line.startswith(("Program Header:", "Section Headers:")):
                # Collect header-table markers verbatim.
                objdump_data["headers"].append(line)

        objdump_data["summary"] = {
            "symbol_count": len(objdump_data["symbols"]),
            "disasm_count": len(objdump_data["disassembly"]),
            "section_count": len(objdump_data["sections"]),
            "header_count": len(objdump_data["headers"]),
        }

        return objdump_data
Lines changed: 55 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,55 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
from typing import Dict, List, Any
10+
from .base_parser import BaseParser
11+
from ..models import FileType, ParsedFile
12+
13+
14+
class PGOProfileParser(BaseParser):
    """Parse textual PGO (profile-guided optimization) profile dumps.

    Performs lightweight line classification: function markers and counter
    lines are collected, and every non-empty line is kept verbatim in
    "raw_lines" for downstream inspection.
    """

    def __init__(self):
        super().__init__(FileType.PGO_PROFILE)

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile with the profile data.

        On unreadable/oversized files or any parse error, returns a
        ParsedFile whose metadata carries an "error" entry instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, {}, {"error": "File too large or unreadable"}
            )

        try:
            profile_data = {"functions": [], "counters": [], "raw_lines": []}

            for line in content.split("\n"):
                line = line.strip()
                if not line:
                    continue

                profile_data["raw_lines"].append(line)

                # Simple pattern matching for PGO profile data; the original
                # also tracked the current function in a local that was never
                # read, which has been removed.
                if line.startswith(("# Func Hash:", "Function:")):
                    profile_data["functions"].append(line)
                elif line.startswith("# Num Counters:") or line.isdigit():
                    profile_data["counters"].append(line)

            metadata = {
                "total_functions": len(profile_data["functions"]),
                "total_counters": len(profile_data["counters"]),
                # Counts non-empty lines only (raw_lines skips blanks).
                "total_lines": len(profile_data["raw_lines"]),
                "file_size": self.get_file_size(file_path),
            }

            return self.create_parsed_file(file_path, profile_data, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, {}, {"error": str(e)})
Lines changed: 81 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,81 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
import json
10+
from typing import List, Dict, Any
11+
from .base_parser import BaseParser
12+
from ..models import FileType, ParsedFile, Diagnostic, SourceLocation
13+
14+
15+
class SARIFParser(BaseParser):
    """Parse SARIF (Static Analysis Results Interchange Format) JSON files
    into a flat list of Diagnostic objects."""

    def __init__(self):
        super().__init__(FileType.STATIC_ANALYSIS_SARIF)

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path*, decode it as SARIF JSON, and return a ParsedFile
        whose data is the list of extracted diagnostics.

        On unreadable/oversized files or any decode/parse error, returns a
        ParsedFile whose metadata carries an "error" entry instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, [], {"error": "File too large or unreadable"}
            )

        try:
            sarif_data = json.loads(content)
            diagnostics = []

            # A SARIF log is a list of "runs", each holding "results".
            runs = sarif_data.get("runs", [])
            for run in runs:
                for result in run.get("results", []):
                    diagnostic = self._parse_sarif_result(result, run)
                    if diagnostic:
                        diagnostics.append(diagnostic)

            metadata = {
                "total_results": len(diagnostics),
                "file_size": self.get_file_size(file_path),
                # The SARIF spec stores the format version in the top-level
                # "version" property; the original reported the "$schema" URI
                # instead, which is kept as a fallback for older dumps.
                "sarif_version": sarif_data.get(
                    "version", sarif_data.get("$schema", "")
                ),
                "runs_count": len(runs),
            }

            return self.create_parsed_file(file_path, diagnostics, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, [], {"error": str(e)})

    def _parse_sarif_result(
        self, result: Dict[str, Any], run: Dict[str, Any]
    ) -> "Diagnostic | None":
        """Convert one SARIF result object into a Diagnostic.

        Returns None when the result is malformed (original annotated the
        return as plain Diagnostic despite this None path). The *run* context
        is currently unused but kept for interface stability.
        """
        try:
            message = result.get("message", {}).get("text", "")
            rule_id = result.get("ruleId", "")

            # SARIF defaults the level to a warning-ish severity; "info" is
            # used here when the result omits it.
            level = result.get("level", "info")

            # Only the first location is used; SARIF allows several.
            location = None
            locations = result.get("locations", [])
            if locations:
                physical_location = locations[0].get("physicalLocation", {})
                artifact_location = physical_location.get("artifactLocation", {})
                region = physical_location.get("region", {})

                if artifact_location.get("uri"):
                    location = SourceLocation(
                        file=artifact_location.get("uri"),
                        line=region.get("startLine"),
                        column=region.get("startColumn"),
                    )

            return Diagnostic(
                level=level, message=message, location=location, code=rule_id
            )

        except Exception:
            return None
Lines changed: 81 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,81 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
import re
10+
from typing import List, Dict, Any
11+
from .base_parser import BaseParser
12+
from ..models import FileType, ParsedFile, Diagnostic, SourceLocation
13+
14+
15+
class StaticAnalyzerParser(BaseParser):
    """Parse clang-style static analyzer text output.

    Lines of the form "<file>:<line>:<col>: <level>: <message>" become
    Diagnostic objects; everything else is kept as a raw-line dict so no
    output is lost.
    """

    def __init__(self):
        super().__init__(FileType.STATIC_ANALYZER)
        # "<file>:<line>:<col>: <level>: <message>" diagnostics.
        # NOTE(review): "[^:]+" stops at the first colon, so Windows drive
        # paths ("C:\...") will not match — confirm inputs are POSIX paths.
        self.analyzer_pattern = re.compile(
            r"(?P<file>[^:]+):(?P<line>\d+):(?P<column>\d+):\s*(?P<level>\w+):\s*(?P<message>.+)"
        )

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile whose data mixes
        Diagnostic objects and {"type": "raw", ...} dicts.

        On unreadable/oversized files or any parse error, returns a
        ParsedFile whose metadata carries an "error" entry instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, [], {"error": "File too large or unreadable"}
            )

        try:
            results = []

            for line in content.split("\n"):
                line = line.strip()
                if not line:
                    continue

                # Structured diagnostic if it matches, raw line otherwise.
                diagnostic = self._parse_analyzer_line(line)
                if diagnostic:
                    results.append(diagnostic)
                else:
                    results.append({"type": "raw", "content": line})

            # Split the total into diagnostics vs. raw lines for metadata.
            diagnostic_count = sum(1 for r in results if isinstance(r, Diagnostic))
            raw_count = len(results) - diagnostic_count

            metadata = {
                "total_results": len(results),
                "diagnostic_count": diagnostic_count,
                "raw_count": raw_count,
                "file_size": self.get_file_size(file_path),
            }

            return self.create_parsed_file(file_path, results, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, [], {"error": str(e)})

    def _parse_analyzer_line(self, line: str) -> "Diagnostic | None":
        """Parse a single analyzer line into a Diagnostic.

        Returns None when the line does not look like a diagnostic (the
        original annotated the return as plain Diagnostic despite this path).
        """
        match = self.analyzer_pattern.match(line)
        if match is None:
            return None
        try:
            location = SourceLocation(
                file=match.group("file"),
                # \d+ guarantees digits, so these int() calls should not
                # raise; the guard below is kept as defensive belt-and-braces.
                line=int(match.group("line")),
                column=int(match.group("column")),
            )

            return Diagnostic(
                level=match.group("level"),
                message=match.group("message"),
                location=location,
            )
        except ValueError:
            return None

0 commit comments

Comments
 (0)