codeflaws and whitebox
This commit is contained in:
@@ -0,0 +1,183 @@
|
||||
import bugzoo
|
||||
from bugzoo import server, Container
|
||||
import csv
|
||||
import os
|
||||
from common.commons import *
|
||||
DATA_PATH = os.environ["DATA_PATH"]
|
||||
ROOT_DIR = os.environ["ROOT_DIR"]
|
||||
DATASET = os.environ["dataset"]
|
||||
COCCI_PATH = join(os.environ["coccinelle"],'spatch')
|
||||
def patchSourceFile(bugPath,spfile,bugName):
|
||||
# print(bugPath)
|
||||
# srcName = bugPath.split('/')[-1].split('-')[0]
|
||||
srcPath = bugPath
|
||||
patchName = bugName
|
||||
|
||||
|
||||
|
||||
if(isfile(join(DATA_PATH,"codeflaws",bugName,'patched',patchName+spfile+'.c'))):
|
||||
return join(DATA_PATH,"codeflaws",bugName,'patched',patchName+spfile+'.c')
|
||||
|
||||
if not (isfile(join(DATA_PATH,"codeflaws",bugName,'patches',patchName+spfile+'.txt'))):
|
||||
cmd = COCCI_PATH + ' --sp-file ' + join(DATASET, 'cocci', spfile) + ' ' + srcPath + ' --patch -o' + join(
|
||||
DATA_PATH, "codeflaws", bugName, 'patches', patchName) + ' > ' + join(DATA_PATH, "codeflaws", bugName,
|
||||
'patches',
|
||||
patchName + spfile + '.txt')
|
||||
|
||||
output, e = shellGitCheckout(cmd)
|
||||
# logging.info(output)
|
||||
patchSize = os.path.getsize(join(DATA_PATH,"codeflaws",bugName,'patches',patchName+spfile+'.txt'))
|
||||
if patchSize == 0 :
|
||||
# os.remove(join(DATA_PATH,"introclass",bugName,'patches',patchName+spfile+'.txt'))
|
||||
return None
|
||||
else:
|
||||
|
||||
cmd = 'patch -d '+'/'.join(srcPath.split('/')[:-1])+' -i '+join(DATA_PATH,"codeflaws",bugName,'patches',patchName+spfile+'.txt')+' -o '+join(DATA_PATH,"codeflaws",bugName,'patched',patchName+spfile+'.c')
|
||||
o,e = shellGitCheckout(cmd)
|
||||
return join(DATA_PATH, "codeflaws", bugName, 'patched', patchName + spfile + '.c')
|
||||
|
||||
|
||||
def readTestSuite(testPath):
|
||||
regex = r"([p|n0-9]+)\)"
|
||||
with open(testPath,mode='r') as testFile:
|
||||
test_str = testFile.read()
|
||||
matches = re.finditer(regex, test_str, re.MULTILINE)
|
||||
|
||||
testList = []
|
||||
for matchNum, match in enumerate(matches, start=1):
|
||||
|
||||
for groupNum in range(0, len(match.groups())):
|
||||
groupNum = groupNum + 1
|
||||
testList.append(match.group(groupNum))
|
||||
return testList
|
||||
|
||||
def test_all(testerPath,validTests):
|
||||
test_outcomes = {} # type: Dict[TestCase, TestOutcome]
|
||||
failure_cases = []
|
||||
failure = 0
|
||||
total = len(validTests)
|
||||
for test in validTests:
|
||||
# if test.name in validTests:
|
||||
cmd ='bash ' + testerPath + ' {}'.format(test)
|
||||
out,e = shellGitCheckout(cmd)
|
||||
# out = client.containers.exec(container=container, command=cmd, context='/experiment/')
|
||||
|
||||
if 'Accepted' not in out or e != '':
|
||||
failure += 1
|
||||
failure_cases.append(test)
|
||||
# test_outcomes.append(out.output)
|
||||
break
|
||||
|
||||
# test_outcomes[test] = client.containers.test(container, test)
|
||||
# if test.expected_outcome != test_outcomes[test].passed:
|
||||
# if test_outcomes[test].passed != True:
|
||||
# failure.append(test.name)
|
||||
# failure_cases.append(test.command)
|
||||
# break
|
||||
return failure_cases, failure, total
|
||||
|
||||
def validateCore(bugName):
|
||||
|
||||
if not os.path.exists(join(DATA_PATH, 'codeflaws', bugName, 'patches')):
|
||||
os.makedirs(join(DATA_PATH, 'codeflaws', bugName, 'patches'))
|
||||
if not os.path.exists(join(join(DATA_PATH, 'codeflaws', bugName, 'patched'))):
|
||||
os.makedirs(join(DATA_PATH, 'codeflaws', bugName, 'patched'))
|
||||
|
||||
fix = 'failure'
|
||||
output = ''
|
||||
# print("bugName: {}".format(bugName), end=' ')
|
||||
output += 'bugName:' + bugName + ', '
|
||||
|
||||
# spfiles = listdir(join(DATASET, 'cocci'))
|
||||
spfiles = load_zipped_pickle(join(DATA_PATH, 'uniquePatterns.pickle'))
|
||||
|
||||
spfiles['uProjects'] = spfiles.uFiles.apply(lambda x: list(set([i.split('/{')[0].replace('(','') for i in x])))
|
||||
spfiles[~spfiles.uProjects.apply(lambda x: np.all([i == 'codeflaws' for i in x]))]
|
||||
spfiles = spfiles[['uid']]
|
||||
|
||||
|
||||
cmd = 'make -C ' + join(DATA_PATH, 'codeflaws', bugName) + ' clean'
|
||||
o, e = shellGitCheckout(cmd)
|
||||
# print("patching... " + bugName)
|
||||
|
||||
contestid, problem, _, buggyId, acceptedId = bugName.split('-')
|
||||
|
||||
|
||||
# for idx, spfile in enumerate(spfiles):
|
||||
for idx, spfile in enumerate(spfiles.uid.values.tolist()):
|
||||
if spfile == '.DS_Store':
|
||||
continue
|
||||
|
||||
# originalBugs = get_filepaths(join(DATA_PATH, 'manybugs', bugName, 'diffs'), preId)
|
||||
buggyFileName = contestid+'-'+problem+'-'+buggyId+'.c'
|
||||
path = join(DATA_PATH,'codeflaws',bugName,buggyFileName)
|
||||
patch = patchSourceFile(path, spfile, bugName)
|
||||
|
||||
times = 0
|
||||
if patch is None:
|
||||
continue
|
||||
|
||||
shutil.copy2(patch,join(DATA_PATH, 'codeflaws', bugName))
|
||||
|
||||
cmd = 'make -C ' + join(DATA_PATH, 'codeflaws', bugName) + ' FILENAME=' + bugName + spfile
|
||||
o, e = shellGitCheckout(cmd)
|
||||
|
||||
|
||||
# patch_result = output
|
||||
# TODO logic
|
||||
# if patch_result.successful:
|
||||
if isfile(join(DATA_PATH,'codeflaws',bugName,bugName+spfile)):
|
||||
|
||||
output += '@True:' + str(idx) + ':' + patch.split('/')[-1] + '@'
|
||||
|
||||
validTests = readTestSuite(join(DATA_PATH, 'codeflaws', bugName, 'test-valid.sh'))
|
||||
post_failure_cases, post_failure, total = test_all(join(DATA_PATH, 'codeflaws', bugName, 'test-valid.sh'), validTests)
|
||||
|
||||
# print("{}".format(post_failure), end=' ')
|
||||
output += str(post_failure) + ' '
|
||||
if post_failure == 0:
|
||||
times += 1
|
||||
fix = 'success'
|
||||
# print("fix {} by {}".format(bugName, patch_name))
|
||||
output += 'fix {} by {} '.format(bugName, patch)
|
||||
break
|
||||
# print("@fail:{}@total:{}".format(post_failure, total),end=' ')
|
||||
# print("@post_failure_cases:{}".format(post_failure_cases))
|
||||
|
||||
# cmd = 'docker rm -fv {}'.format(container.id)
|
||||
# out, e = shellGitCheckout(cmd)
|
||||
|
||||
output += 'times:{}, '.format(times) + fix
|
||||
print(output)
|
||||
return output
|
||||
|
||||
# failure_cases, failure, total, test_outcomes = test_all(bug, container, client)
|
||||
# if failure == 0:
|
||||
# fix = 'success'
|
||||
# # print("fix {} by {}".format(bugName, patch_name))
|
||||
# output += 'fix {} by {} '.format(bugName, patch)
|
||||
# break
|
||||
# else:
|
||||
# output += ' {}'.format(failure_cases)
|
||||
# else:
|
||||
# output += '@False:' + str(idx) + ':' + patch.split('/')[-1] + '@'
|
||||
# output += 'times:{}, '.format(times) + fix
|
||||
#
|
||||
# return output
|
||||
|
||||
def validate():
|
||||
bugs2test= listdir(join(DATA_PATH, 'codeflaws'))
|
||||
|
||||
bugList = []
|
||||
for b in bugs2test:
|
||||
if b == '.DS_Store' or b == 'README.md' or b == 'codeflaws-defect-detail-info.txt':
|
||||
continue
|
||||
bugList.append(b)
|
||||
|
||||
# results = parallelRunMerge(testCore, bugList,max_workers=10)
|
||||
results = parallelRunMerge(validateCore, bugList)
|
||||
print('\n'.join(results))
|
||||
with open(join(DATA_PATH, 'codeFlawsResults'), 'w',
|
||||
encoding='utf-8') as writeFile:
|
||||
writeFile.write('\n'.join(results))
|
||||
validateCore(b)
|
||||
Reference in New Issue
Block a user