-
Notifications
You must be signed in to change notification settings - Fork 20
/
Copy pathgetAllEntities.py
executable file
·135 lines (112 loc) · 3.77 KB
/
getAllEntities.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
#! /usr/bin/env python3
# -*- coding: utf-8 -*-
'''
Created on 2020-08-09
@author: mingo
@module:
'''
import os
import csv
import json
import re
from tqdm import tqdm
def clean_entity_name(s):
re_entity = re.compile(r'@B_\S+_E@')
entities = re_entity.findall(s)
if entities:
entity = s[3:-3].replace('#', '.')
return entity[:] if entity[0] != '.' else entity[1:]
else:
result = s
if '<' in result:
k = result.find('<')
result = result[0:k]
if '(' in result:
k = result.find('(')
result = result[0:k]
result = result.replace('[]', '')
if '#' in result:
k1 = result.find('#')
result = result[k1+1:]
return result
def clean_method(method):
method = method.replace('.<init>', '.init')
return method
def get_package_name_from_class(class_name):
for i, c in enumerate(class_name):
if c.isupper():
return class_name[0:i-1]
def get_class_name_from_method(method_name):
split_method = method_name.split('.')
split_method.reverse()
for i, part in enumerate(split_method):
if part[0].isupper():
class_start = i
class_part = split_method[class_start: ]
class_part.reverse()
class_name = '.'.join(class_part)
return class_name
def get_package_name_from_method(method_name):
for i, c in enumerate(method_name):
if c.isupper():
return method_name[0:i-1]
def getEntities(json_path, all_entities):
if not os.path.exists(json_path):
return
data = json.load(open(json_path))
class_name = clean_entity_name(data['ClassName'])
package_name = get_package_name_from_class(class_name)
if class_name:
all_entities[class_name] = entity_type['class']
if package_name:
all_entities[package_name] = entity_type['package']
for method in data['Functions']:
method_name = class_name + '.' + method[0:method.find('(')]
all_entities[method_name] = entity_type['method']
def loadPermissionsExternal(all_entities):
permissions_path = 'res/all_permissions.txt'
with open(permissions_path) as f:
for line in f:
permission = line.strip()
if permission:
all_entities[permission] = entity_type['permission']
def loadEntitiesInExternal(all_entites):
external_file_path = 'res/extra_permission_relations.txt'
with open(external_file_path) as f:
for line in f:
temp = line.strip().split(' ')
method_name = clean_method(temp[0])
all_entites[method_name] = entity_type['method']
def printEntitiesInfo(all_entites):
count_entities = {}
for t,v in entity_type.items():
count_entities[v] = 0
for entity in all_entites:
count_entities[all_entites[entity]] += 1
print('=========== entities =============')
for t,v in entity_type.items():
print('%s: %d' % (t, count_entities[v]))
def getAllEntities():
global entity_type
entity_type = {
'package':1,
'class':2,
'method':3,
'permission':4
}
all_entities = {}
doc_json_dir = 'res/API_docs_in_json'
json_files = os.listdir(doc_json_dir)
for j_f in tqdm(json_files):
j_f_path = os.path.join(doc_json_dir, j_f)
getEntities(j_f_path, all_entities)
loadPermissionsExternal(all_entities)
loadEntitiesInExternal(all_entities)
save_entities = [[entity, all_entities[entity]] for entity in all_entities]
save_entities.sort(key = lambda x:x[1])
with open('res/entities.txt','w',newline='') as f:
writer = csv.writer(f)
writer.writerows(save_entities)
printEntitiesInfo(all_entities)
if __name__ == "__main__":
getAllEntities()