123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179 |
- import csv
- import os
- import json
- import re
- import xlrd
- import xlwt
- def write_csv(node_list):
- with open("tmp_res.csv", "w", newline="") as file:
- csvwriter = csv.writer(file, dialect=("excel"))
-
- csvwriter.writerows(node_list)
- def walk_files(path, endpoint='.py'):
- file_list = []
- for root, dirs, files in os.walk(path):
- for file in files:
- file_path = os.path.join(root, file)
- if file_path.endswith(endpoint):
- file_list.append(open(file_path, encoding='utf-8'))
- return file_list
- def walk_files_path(path, endpoint='.py'):
- file_list = []
- for root, dirs, files in os.walk(path):
- for file in files:
- file_path = os.path.join(root, file)
- if file_path.endswith(endpoint):
- file_list.append(file_path)
- return file_list
- def load_json(json_file):
- with open(json_file, 'r') as load_f:
- load_dict = json.load(load_f)
- return load_dict
- def write_json(json_file, data):
- with open(json_file, 'w') as file:
- file.write(json.dumps(data))
- def load_location(file_path):
- wk_bk = xlrd.open_workbook(file_path)
- wk_all = wk_bk.sheet_by_index(0)
- location_list = [(location.split('/')[0].replace('.py', '').replace('.', '/') + '.py', int(location.split('/')[1]))
- for location in list(wk_all.col_values(0))[2:] if location != '']
- datatype_list = [data_type.split('/')[-1] for data_type in wk_all.col_values(1)[2:] if data_type != '']
- purpose_list = [purpose for purpose in wk_all.col_values(2)[2:] if purpose != '']
- location_dict = {}
- for i in range(len(location_list)):
- if location_list[i] in location_dict.keys():
- location_dict[location_list[i]].append((datatype_list[i], purpose_list[i]))
- else:
- location_dict[location_list[i]] = [(datatype_list[i], purpose_list[i])]
-
-
-
-
- return
- def write_to_excel(stamp, file_path):
- book = xlwt.Workbook(encoding='utf-8')
- sheet_datatype = book.add_sheet("DataType")
- sheet_purpose = book.add_sheet("Purpose")
- sheet_datatype.write(0, 0, "Location")
- sheet_datatype.write(0, 1, "DataType")
- sheet_datatype.write(0, 2, "confidence")
- sheet_datatype.write(0, 3, "Script")
- sheet_purpose.write(0, 0, "Location")
- sheet_purpose.write(0, 1, "Purpose")
- sheet_purpose.write(0, 2, "confidence")
- sheet_purpose.write(0, 3, "Script")
- i = 1
- j = 1
- for st in stamp:
- loc = st[0] + ' ' + str(st[1])
- datatype = list(set([data[0] for data in st[2] if data[0] != 'Data']))
- purpose = list(set([data[1] for data in st[2] if data[1] != 'Usage']))
- for data in datatype:
- sheet_datatype.write(i, 0, loc)
- sheet_datatype.write(i, 1, data)
- sheet_datatype.write(i, 2, 1)
- i += 1
- for pur in purpose:
- sheet_purpose.write(j, 0, loc)
- sheet_purpose.write(j, 1, pur)
- sheet_purpose.write(j, 2, 1.0 / len(purpose))
- j += 1
- book.save(file_path)
- def list_to_excel(file_path, data_type_list, purpose_list):
- book = xlwt.Workbook(encoding='utf-8')
- sheet_datatype = book.add_sheet("DataType")
- sheet_purpose = book.add_sheet("Purpose")
- sheet_datatype.write(0, 0, "Location")
- sheet_datatype.write(0, 1, "DataType")
- sheet_datatype.write(0, 2, "confidence")
- sheet_datatype.write(0, 3, "Script")
- sheet_purpose.write(0, 0, "Location")
- sheet_purpose.write(0, 1, "Purpose")
- sheet_purpose.write(0, 2, "confidence")
- sheet_purpose.write(0, 3, "Script")
- i = 1
- j = 1
- for data in data_type_list:
- sheet_datatype.write(i, 0, data[0])
- sheet_datatype.write(i, 1, data[1])
- sheet_datatype.write(i, 2, 1)
- i += 1
- for pur in purpose_list:
- sheet_purpose.write(j, 0, pur[0])
- sheet_purpose.write(j, 1, pur[1])
- sheet_purpose.write(j, 2, 1)
- j += 1
- book.save(file_path)
- def load_data_purpose_split(file_path):
- wk_bk = xlrd.open_workbook(file_path)
- wk_all = wk_bk.sheet_by_index(0)
- data_type_list = []
- purpose_list = []
- for i in range(2, wk_all.nrows):
- path = wk_all.row_values(i)[0]
- data_type = wk_all.row_values(i)[1]
- purpose = wk_all.row_values(i)[2]
- if path != '':
- path = path.replace('/', ' ').replace('.', '/').replace('/py', '.py')
- if data_type != '' and data_type != 'any':
- data_type_list.append((path, data_type.split('/')[-1]))
- if purpose != 'Usage' and purpose != '':
- purpose_list.append((path, purpose))
- return data_type_list, purpose_list
- def verify_file_list(file_list):
- for file in file_list:
- with open(file, encoding='utf-8') as f:
- content = f.read()
- if re.search(r'=[ ]*lambda[^:]*:', content):
- content_new = re.sub(r'=[ ]*lambda[^:]*:', '=', content)
- file_new = file.replace('.py', '-backup.py')
- with open(file_new, 'w', encoding='utf-8') as f_new:
- f_new.write(content_new)
- file_list.remove(file)
- file_list.append(file_new)
- return file_list
- if __name__ == '__main__':
- file_list = walk_files_path('/Users/liufan/program/PYTHON/SAP/TestProject')
- verify_file_list(file_list)
|