-
Notifications
You must be signed in to change notification settings - Fork 47
Expand file tree
/
Copy pathanalyzer.py
More file actions
147 lines (128 loc) · 8 KB
/
analyzer.py
File metadata and controls
147 lines (128 loc) · 8 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
import os
from pathlib import Path
import subprocess
from ...entities import *
from ...entities.entity import Entity
from ...entities.file import File
from typing import Optional
from ..analyzer import AbstractAnalyzer
from multilspy import SyncLanguageServer
import tree_sitter_java as tsjava
from tree_sitter import Language, Node
from xml.etree import ElementTree
import logging
# Module-wide logger, registered under the fixed name 'code_graph'
# (not derived from this module's __name__).
logger = logging.getLogger('code_graph')
class JavaAnalyzer(AbstractAnalyzer):
    """Analyzer for Java source files built on the tree-sitter Java grammar.

    The class maps tree-sitter declaration nodes to entity labels, collects
    the symbols (super types, calls, parameter/return types) each entity
    refers to, and resolves those symbols to entities.

    NOTE(review): ``self._captures``, ``self.resolve`` and ``self.find_parent``
    are not defined in this class; presumably they come from
    ``AbstractAnalyzer`` -- confirm there.
    """

    # XML namespace prefix used for the elements looked up in pom.xml.
    _POM_NS = '{http://maven.apache.org/POM/4.0.0}'

    # tree-sitter node type -> entity label. Insertion order is the order
    # returned by get_entity_types().
    _ENTITY_LABELS = {
        'class_declaration': "Class",
        'interface_declaration': "Interface",
        'enum_declaration': "Enum",
        'method_declaration': "Method",
        'constructor_declaration': "Constructor",
    }

    # Node types that declare a type / a callable, respectively.
    _TYPE_DECLARATIONS = ['class_declaration', 'interface_declaration', 'enum_declaration']
    _CALLABLE_DECLARATIONS = ['method_declaration', 'constructor_declaration']

    def __init__(self) -> None:
        """Initialise the base analyzer with the tree-sitter Java language."""
        super().__init__(Language(tsjava.language()))

    def add_dependencies(self, path: Path, files: list[Path]) -> None:
        """Unpack the sources of the project's Maven dependencies.

        Reads ``<path>/pom.xml``, and for every ``<dependency>`` element looks
        for ``<artifactId>-<version>-sources.jar`` in the local Maven
        repository (``~/.m2/repository``). Each jar found is copied to
        ``<path>/temp_deps/<artifactId>-<version>/`` and extracted there.
        Finally every ``*.java`` file below ``<path>/temp_deps`` is appended
        to ``files`` (the list is mutated in place).

        Any previous ``<path>/temp_deps`` directory is removed first.
        Dependencies without a complete groupId/artifactId/version triple,
        duplicates, and dependencies whose sources jar is missing or
        unreadable are skipped with a warning instead of aborting the run.

        Args:
            path: Root directory of the Java project (must contain pom.xml).
            files: List of source files to extend with the dependency sources.

        Raises:
            Errors from ``ElementTree.parse`` (for example a missing or
            malformed pom.xml) propagate to the caller.
        """
        # Function-scope imports so the module's import block stays untouched.
        import shutil
        import zipfile

        # NOTE: an earlier approach decompiled the binary jar with JetBrains'
        # java-decompiler-engine; it is disabled in favour of the -sources.jar.
        deps_root = Path(f"{path}/temp_deps")
        shutil.rmtree(deps_root, ignore_errors=True)

        ns = self._POM_NS
        pom = ElementTree.parse(str(path) + '/pom.xml')
        repository = Path.home() / ".m2" / "repository"
        seen = set()
        for dependency in pom.findall(f'.//{ns}dependency'):
            # findtext() returns None for a missing element and '' for an
            # empty one; both are treated as "coordinate not available".
            group_id, artifact_id, version = (
                (dependency.findtext(f'{ns}{tag}') or '').strip()
                for tag in ('groupId', 'artifactId', 'version')
            )
            if not (group_id and artifact_id and version):
                logger.warning(
                    "Skipping dependency with incomplete coordinates: "
                    "groupId=%r artifactId=%r version=%r",
                    group_id, artifact_id, version,
                )
                continue

            coordinates = (group_id, artifact_id, version)
            if coordinates in seen:
                # The same artifact can be matched more than once by the
                # './/dependency' search; unpack it only once.
                continue
            seen.add(coordinates)

            base_name = f"{artifact_id}-{version}"
            sources_jar = (
                repository / group_id.replace('.', '/') / artifact_id / version
                / f"{base_name}-sources.jar"
            )
            if not sources_jar.is_file():
                logger.warning("Sources jar not found, skipping: %s", sources_jar)
                continue

            target_dir = deps_root / base_name
            target_dir.mkdir(parents=True, exist_ok=True)
            # Keep a copy of the jar next to the extracted sources.
            local_jar = target_dir / f"{base_name}.jar"
            shutil.copy(sources_jar, local_jar)
            try:
                with zipfile.ZipFile(local_jar) as archive:
                    archive.extractall(target_dir)
            except (zipfile.BadZipFile, OSError) as err:
                logger.warning("Could not unpack %s: %s", local_jar, err)

        files.extend(deps_root.rglob("*.java"))

    def get_entity_label(self, node: Node) -> str:
        """Return the entity label ("Class", "Method", ...) for ``node``.

        Raises:
            ValueError: If ``node.type`` is not a supported declaration type.
        """
        try:
            return self._ENTITY_LABELS[node.type]
        except KeyError:
            raise ValueError(f"Unknown entity type: {node.type}") from None

    def get_entity_name(self, node: Node) -> str:
        """Return the text of the declaration's ``name`` field, decoded as UTF-8.

        Raises:
            ValueError: If ``node.type`` is not a supported declaration type.
        """
        if node.type not in self._ENTITY_LABELS:
            raise ValueError(f"Unknown entity type: {node.type}")
        return node.child_by_field_name('name').text.decode('utf-8')

    def get_entity_docstring(self, node: Node) -> Optional[str]:
        """Return the block comment immediately preceding the declaration.

        Returns:
            The comment text decoded as UTF-8 when the previous sibling of
            ``node`` is a ``block_comment``; otherwise ``None`` (including
            when the declaration has no previous sibling at all).

        Raises:
            ValueError: If ``node.type`` is not a supported declaration type.
        """
        if node.type not in self._ENTITY_LABELS:
            raise ValueError(f"Unknown entity type: {node.type}")
        preceding = node.prev_sibling
        # prev_sibling is None when the declaration is the first child of its
        # parent, so it must be checked before reading .type.
        if preceding is not None and preceding.type == "block_comment":
            return preceding.text.decode('utf-8')
        return None

    def get_entity_types(self) -> list[str]:
        """Return the tree-sitter node types this analyzer treats as entities."""
        # A fresh list on every call, so callers may mutate the result.
        return list(self._ENTITY_LABELS)

    def _add_captured_symbols(self, entity: Entity, pattern: str, capture: str,
                              key: str, first_only: bool = False) -> None:
        """Run ``pattern`` on the entity's node and register the captured nodes.

        Every node captured under ``capture`` is added to ``entity`` as a
        symbol under ``key``; with ``first_only`` only the first one is added.
        Nothing happens when the capture name is absent from the result.
        """
        captures = self._captures(pattern, entity.node)
        if capture not in captures:
            return
        captured_nodes = captures[capture]
        if first_only:
            captured_nodes = captured_nodes[:1]
        for captured in captured_nodes:
            entity.add_symbol(key, captured)

    def add_symbols(self, entity: Entity) -> None:
        """Attach to ``entity`` the symbols its declaration refers to.

        * class: implemented interfaces (``implement_interface``) and the
          first captured superclass (``base_class``);
        * interface: extended interfaces (``extend_interface``);
        * method / constructor: method invocations (``call``);
        * method only: parameter types (``parameters``) and the node of the
          ``type`` field (``return_type``).
        """
        node_type = entity.node.type
        if node_type == 'class_declaration':
            self._add_captured_symbols(
                entity,
                "(super_interfaces (type_list (type_identifier) @interface))",
                'interface', "implement_interface")
            self._add_captured_symbols(
                entity,
                "(superclass (type_identifier) @base_class)",
                'base_class', "base_class", first_only=True)
        elif node_type == 'interface_declaration':
            self._add_captured_symbols(
                entity,
                "(extends_interfaces (type_list (type_identifier) @type))?",
                'type', "extend_interface")
        elif node_type in self._CALLABLE_DECLARATIONS:
            self._add_captured_symbols(
                entity, "(method_invocation) @reference.call",
                'reference.call', "call")
            if node_type == 'method_declaration':
                self._add_captured_symbols(
                    entity,
                    "(formal_parameters (formal_parameter type: (_) @parameter))",
                    'parameter', "parameters")
                entity.add_symbol("return_type", entity.node.child_by_field_name('type'))

    def is_dependency(self, file_path: str) -> bool:
        """Return True when ``file_path`` contains ``.jar``."""
        return ".jar" in file_path

    def resolve_path(self, file_path: str, path: Path) -> str:
        """Map a path inside a jar to the matching file under ``temp_deps``.

        Paths that do not contain ``.jar`` are returned unchanged. Otherwise
        ``.jar`` is dropped, ``.class`` becomes ``.java``, and the path is
        split on ``/``: the second segment names the directory below
        ``<path>/temp_deps``, dots in the middle segments become directory
        separators, and the last segment is the file name. For instance
        ``/foo-1.0.jar/com.example/Bar.class`` becomes
        ``<path>/temp_deps/foo-1.0/com/example/Bar.java``.

        NOTE(review): the exact shape of the incoming paths is produced
        outside this file -- confirm against the caller.
        """
        if ".jar" not in file_path:
            return file_path
        segments = file_path.replace(".jar", "").replace(".class", ".java").split("/")
        package_dir = "/".join(segment.replace(".", "/") for segment in segments[2:-1])
        return f"{path}/temp_deps/{segments[1]}/{package_dir}/{segments[-1]}"

    def resolve_type(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, node: Node) -> list[Entity]:
        """Resolve a type reference to the entities of its declaration(s).

        For every ``(file, node)`` pair produced by ``self.resolve`` the
        enclosing class/interface/enum declaration is looked up via
        ``self.find_parent``; it is collected when it is a key of
        ``file.entities``.
        """
        resolved = []
        for file, resolved_node in self.resolve(files, lsp, file_path, path, node):
            type_dec = self.find_parent(resolved_node, self._TYPE_DECLARATIONS)
            if type_dec in file.entities:
                resolved.append(file.entities[type_dec])
        return resolved

    def resolve_method(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, node: Node) -> list[Entity]:
        """Resolve a method invocation to the entities of the called method(s).

        Resolution starts from the ``name`` field of ``node``. For each
        resolved node the nearest enclosing declaration is looked up; results
        whose nearest declaration is a type (class/interface/enum) rather than
        a method or constructor are skipped.
        """
        resolved = []
        candidates = self._CALLABLE_DECLARATIONS + self._TYPE_DECLARATIONS
        for file, resolved_node in self.resolve(files, lsp, file_path, path, node.child_by_field_name('name')):
            method_dec = self.find_parent(resolved_node, candidates)
            if method_dec and method_dec.type in self._TYPE_DECLARATIONS:
                # The name resolved to something directly inside a type body,
                # not inside a method or constructor.
                continue
            if method_dec in file.entities:
                resolved.append(file.entities[method_dec])
        return resolved

    def resolve_symbol(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, key: str, symbol: Node) -> list[Entity]:
        """Dispatch symbol resolution according to the symbol ``key``.

        Type-like keys go through ``resolve_type`` and ``"call"`` goes
        through ``resolve_method``.

        Raises:
            ValueError: If ``key`` is not one of the known symbol keys.
        """
        if key in ["implement_interface", "base_class", "extend_interface", "parameters", "return_type"]:
            return self.resolve_type(files, lsp, file_path, path, symbol)
        if key in ["call"]:
            return self.resolve_method(files, lsp, file_path, path, symbol)
        raise ValueError(f"Unknown key {key}")

    def add_file_imports(self, file: File) -> None:
        """
        Extract and add import statements from the file.
        Java imports are not yet implemented, so this is currently a no-op.
        """
        # TODO: Implement Java import tracking

    def resolve_import(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, import_node: Node) -> list[Entity]:
        """
        Resolve an import statement to the entities it imports.
        Java imports are not yet implemented, so an empty list is returned.
        """
        # TODO: Implement Java import resolution
        return []