Merge pull request #390 from JiahaoLi2003/patch-1

Update ECL with ECE
This commit is contained in:
Chen Qian 2024-06-21 10:13:01 +08:00 committed by GitHub
commit f880570c76
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

146
ecl/ece.py Normal file
View File

@ -0,0 +1,146 @@
import os
import json
import re
import numpy as np
import argparse
point = 0.95
eliminate_threshold = 0.95
def retrieve_eliminate(directory_Path,directory_Memory,eliminated_directory):
experiences_use = []
content = []
content1 = []
experiences_total = []
usetime_total = []
exp_dict = {}
eliminated_exp = []
directories = [os.path.join(directory_Path, d) for d in os.listdir(directory_Path) if os.path.isdir(os.path.join(directory_Path, d))]
for subdir in directories:
directory = subdir
logdir = [filename for filename in os.listdir(directory) if filename.endswith(".log")]
logdir = os.path.join(directory, logdir[0])
content1 = open(logdir, "r", encoding='UTF-8').read()
pattern1 = re.compile(r'the source code MIDs is (.*?),', re.S)
experiences_sourceMIDs = re.findall(pattern1, content1)
pattern2 = re.compile(r'the target code MIDs is (.*?)\n',re.S)
experiences_targetMIDs = re.findall(pattern2, content1)
pattern3 = re.compile(r'And the (.*?) similarity is',re.S)
experiences_type = re.findall(pattern3,content1)
for i in range(0,len(experiences_sourceMIDs)):
sourceMID = experiences_sourceMIDs[i]
targetMID = experiences_targetMIDs[i]
type = experiences_type[i]
experiences_use.append((sourceMID,targetMID,type))
with open(directory_Memory) as file:
content1 = json.load(file)
new_content = []
for memorypiece in content1:
experiences = memorypiece.get("experiences")
if experiences != None:
experiences_total.extend(experiences)
for experience in experiences:
experience["use_time"] = 0
for experience in experiences_use:
for experience_t in experiences_total:
if experience[0] == experience_t["sourceMID"] and experience[1] == experience_t["targetMID"]:
experience_t["use_time"] += 1
for i,experience_t in enumerate(experiences_total):
usetime_total.append(experience_t["use_time"])
exp_dict[i] = experience_t["use_time"]
file.close()
usetime_sort = sorted(usetime_total)[::-1]
total = np.sum(usetime_sort)
for i in range(len(usetime_sort)):
if np.sum(usetime_sort[:i])/total >= point:
# print("α",i)
alpha= i
break
index=0
for k in sorted(exp_dict,key=exp_dict.__getitem__,reverse=True):
if index <= alpha:
eliminated_exp.append(experiences_total[k])
index += 1
else:
break
for memorypiece in content1:
experiences = memorypiece.get("experiences")
retrieve_eliminated_experienceList = []
if experiences != None:
for experience in experiences:
if experience in eliminated_exp:
retrieve_eliminated_experienceList.append(experience)
memorypiece["experiences"] = retrieve_eliminated_experienceList
new_content.append(memorypiece)
with open(eliminated_directory, 'w') as file:
json.dump(new_content, file)
# Quality score gain Elimination
def gain_eliminate(directory_NewMemory,eliminated_directory):
content2 = []
with open(directory_NewMemory) as file:
content2 = json.load(file)
new_content2 = []
for memorypiece in content2:
experiences = memorypiece.get("experiences")
gain_eliminated_experienceList = []
if experiences != None:
# print("origin:", len(experiences))
for experience in experiences:
valueGain = experience.get("valueGain")
# print(valueGain)
if valueGain >= eliminate_threshold:
gain_eliminated_experienceList.append(experience)
# print(len(experiences))
memorypiece["experiences"] = gain_eliminated_experienceList
new_content2.append(memorypiece)
else:
new_content2.append(memorypiece)
file.close()
with open(eliminated_directory, 'r') as file:
new_content = json.load(file)
new_content = new_content + new_content2
with open(eliminated_directory, 'w') as file:
json.dump(new_content, file)
def recount_experience(eliminated_directory):
with open(eliminated_directory, 'r') as file:
content = json.load(file)
with open(eliminated_directory, 'w') as file:
i = 0
for memorypiece in content:
memorypiece["total"] = i
i += 1
json.dump(content, file)
def main():
parser = argparse.ArgumentParser(description="Process memory with some directories.")
parser.add_argument("directory_Path", type = str, help="The directory of software")
parser.add_argument("directory_Memory", type=str, help="The directory of MemoryCards")
parser.add_argument("directory_NewMemory", type=str, help="The directory of NewMemoryCards")
parser.add_argument("eliminated_directory", type= str, help="The directory for output")
args = parser.parse_args()
retrieve_eliminate(args.directory_Path,args.directory_Memory,args.eliminated_directory)
gain_eliminate(args.directory_NewMemory,args.eliminated_directory)
recount_experience(args.eliminated_directory)
if __name__ == "__main__":
main()