Skip to content

Commit a79cb5a

Browse files
committed
[llvm-advisor] Add preprocessing and dependency analysis parsers
- implement preprocessed source parser for macro analysis - add macro expansion parser for preprocessing inspection - add include tree parser for dependency visualization - add build dependencies parser for project structure analysis - add debug information parser for DWARF data processing
1 parent bfda88d commit a79cb5a

File tree

5 files changed

+596
-0
lines changed

5 files changed

+596
-0
lines changed
Lines changed: 106 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,106 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
import re
10+
from typing import Dict, List, Any
11+
from .base_parser import BaseParser
12+
from ..models import FileType, ParsedFile
13+
14+
15+
class DebugParser(BaseParser):
    """Parse compiler debug-information dumps (DWARF entries, line tables).

    The parsed payload is a dict with "dwarf_entries", "line_info",
    "sections" (keyed by ".debug_*" header) and a "summary" of counts.
    """

    def __init__(self):
        super().__init__(FileType.DEBUG)
        # Rows of the form "<depth><hexoffset>: content" from DWARF dumps.
        self.dwarf_pattern = re.compile(r"^\s*<(\d+)><([0-9a-fA-F]+)>:\s*(.+)")
        # Rows of the form "Line N, column M, rest" from debug line tables.
        self.debug_line_pattern = re.compile(
            r"^\s*Line\s+(\d+),\s*column\s+(\d+),\s*(.+)"
        )

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile with extracted debug data.

        Failures (unreadable file, parse error) are reported through an
        "error" key in metadata instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, {}, {"error": "File too large or unreadable"}
            )

        try:
            lines = content.split("\n")
            debug_data = self._parse_debug_info(lines)

            metadata = {
                "file_size": self.get_file_size(file_path),
                "total_lines": len(lines),
            }
            metadata.update(debug_data["summary"])

            return self.create_parsed_file(file_path, debug_data, metadata)
        except Exception as e:
            return self.create_parsed_file(file_path, {}, {"error": str(e)})

    def _parse_debug_info(self, lines: List[str]) -> Dict[str, Any]:
        """Walk dump lines and bucket them into entries, line info and sections."""
        result: Dict[str, Any] = {
            "dwarf_entries": [],
            "line_info": [],
            "sections": {},
            "summary": {},
        }
        section = None  # name of the ".debug_*" section currently open

        for raw in lines:
            stripped = raw.strip()
            if not stripped:
                continue

            # A bare ".debug_*" header opens a new section bucket.
            if stripped.startswith(".debug_"):
                section = stripped
                result["sections"][section] = []
                continue

            # DWARF DIE rows; the pattern tolerates leading whitespace itself.
            m = self.dwarf_pattern.match(raw)
            if m:
                entry = {
                    "depth": int(m.group(1)),
                    "offset": m.group(2),
                    "content": m.group(3),
                }
                result["dwarf_entries"].append(entry)
                if section:
                    result["sections"][section].append(entry)
                continue

            # Debug line-table rows.
            m = self.debug_line_pattern.match(raw)
            if m:
                info = {
                    "line": int(m.group(1)),
                    "column": int(m.group(2)),
                    "info": m.group(3),
                }
                result["line_info"].append(info)
                if section:
                    result["sections"][section].append(info)
                continue

            # Anything else is kept verbatim under the current section.
            if section:
                result["sections"][section].append({"raw": stripped})

        result["summary"] = {
            "dwarf_entry_count": len(result["dwarf_entries"]),
            "line_info_count": len(result["line_info"]),
            "section_count": len(result["sections"]),
        }

        return result
Lines changed: 106 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,106 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
from typing import Dict, List, Any
10+
from .base_parser import BaseParser
11+
from ..models import FileType, ParsedFile, Dependency
12+
13+
14+
class DependenciesParser(BaseParser):
    """Parse build-dependency listings into Dependency edges.

    Supports two notations:
      * make-style rules ("target: src1 src2 \\" plus indented continuation
        lines), as emitted into .d files by compilers;
      * simple arrow edges ("source -> target" or "source => target").
    """

    def __init__(self):
        super().__init__(FileType.DEPENDENCIES)

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile whose data is a list of
        Dependency objects, with source/target counts in metadata.

        Failures are reported via an "error" metadata key instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, [], {"error": "File too large or unreadable"}
            )

        try:
            lines = content.split("\n")
            dependencies = self._parse_dependencies(lines)

            # Calculate statistics over the edge endpoints.
            sources = set()
            targets = set()
            for dep in dependencies:
                sources.add(dep.source)
                targets.add(dep.target)

            metadata = {
                "file_size": self.get_file_size(file_path),
                "total_dependencies": len(dependencies),
                "unique_sources": len(sources),
                "unique_targets": len(targets),
                "unique_files": len(sources.union(targets)),
            }

            return self.create_parsed_file(file_path, dependencies, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, [], {"error": str(e)})

    def _parse_dependencies(self, lines: List[str]) -> List[Dependency]:
        """Extract Dependency edges from the raw dependency-file lines."""
        dependencies: List[Dependency] = []
        current_target = None

        for raw in lines:
            line = raw.strip()
            if not line:
                continue

            # BUG FIX: indentation must be tested on the raw line. The old
            # code stripped first and then called line.startswith(" "/"\t"),
            # which is always False after strip() — so make-style
            # continuation lines were never recognized and their sources
            # were silently dropped (current_target was reset instead).
            indented = raw.startswith((" ", "\t"))

            # Handle make-style rule headers (target: source1 source2 ...)
            if ":" in line and not indented:
                target, _, sources = line.partition(":")
                current_target = target.strip()
                for source in sources.split():
                    if source != "\\":  # skip line-continuation backslashes
                        dependencies.append(
                            Dependency(
                                source=source,
                                target=current_target,
                                type="dependency",
                            )
                        )

            # Handle indented continuation lines of the previous rule
            elif indented and current_target:
                for source in line.split():
                    if source != "\\":
                        dependencies.append(
                            Dependency(
                                source=source,
                                target=current_target,
                                type="dependency",
                            )
                        )

            # Handle simple dependency edges (one per line)
            elif "->" in line or "=>" in line:
                sep = "->" if "->" in line else "=>"
                source, _, target = line.partition(sep)
                dependencies.append(
                    Dependency(
                        source=source.strip(),
                        target=target.strip(),
                        type="dependency",
                    )
                )

            # Any other non-indented line ends the current rule's scope.
            elif not indented:
                current_target = None

        return dependencies
Lines changed: 91 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,91 @@
1+
# ===----------------------------------------------------------------------===//
2+
#
3+
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4+
# See https://llvm.org/LICENSE.txt for license information.
5+
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6+
#
7+
# ===----------------------------------------------------------------------===//
8+
9+
import re
10+
from typing import Dict, List, Any
11+
from .base_parser import BaseParser
12+
from ..models import FileType, ParsedFile, Dependency
13+
14+
15+
class IncludeTreeParser(BaseParser):
    """Parse an indentation-based include tree into edges and a flat tree list."""

    def __init__(self):
        super().__init__(FileType.INCLUDE_TREE)
        # Captures: (leading whitespace, file token, optional "(extra info)").
        self.include_pattern = re.compile(r"^(\s*)(\S+)\s*(?:\(([^)]+)\))?")

    def parse(self, file_path: str) -> ParsedFile:
        """Read *file_path* and return a ParsedFile describing the include tree.

        Failures are reported via an "error" metadata key instead of raising.
        """
        content = self.read_file_safe(file_path)
        if content is None:
            return self.create_parsed_file(
                file_path, [], {"error": "File too large or unreadable"}
            )

        try:
            lines = content.split("\n")
            include_data = self._parse_include_tree(lines)

            metadata = {
                "file_size": self.get_file_size(file_path),
                "total_includes": len(include_data["dependencies"]),
                "unique_files": len(include_data["files"]),
                "max_depth": include_data["max_depth"],
            }

            return self.create_parsed_file(file_path, include_data, metadata)

        except Exception as e:
            return self.create_parsed_file(file_path, [], {"error": str(e)})

    def _parse_include_tree(self, lines: List[str]) -> Dict[str, Any]:
        """Turn indented include-tree lines into edges, a file set and tree rows."""
        tree: Dict[str, Any] = {
            "dependencies": [],
            "files": set(),
            "tree": [],
            "max_depth": 0,
        }
        ancestors: List[str] = []  # chain of parent files above the current line

        for line in lines:
            if not line.strip():
                continue

            m = self.include_pattern.match(line)
            if not m:
                continue

            indent_width = len(m.group(1))
            path = m.group(2)
            extra = m.group(3)

            depth = indent_width // 2  # Assuming 2 spaces per indent level
            if depth > tree["max_depth"]:
                tree["max_depth"] = depth

            # Discard ancestors at or below this line's depth.
            del ancestors[depth:]

            tree["files"].add(path)

            # Record the edge from the nearest ancestor, if any.
            parent = ancestors[-1] if ancestors else None
            if parent is not None:
                tree["dependencies"].append(
                    Dependency(source=parent, target=path, type="include")
                )

            tree["tree"].append(
                {
                    "file": path,
                    "depth": depth,
                    "parent": parent,
                    "extra_info": extra,
                }
            )

            # This file becomes the parent for deeper lines that follow.
            ancestors.append(path)

        # Sets don't serialize to JSON; hand back a list instead.
        tree["files"] = list(tree["files"])

        return tree

0 commit comments

Comments
 (0)