hopefully a bit more specificity on this

This commit is contained in:
mjgaughan 2023-11-08 11:10:27 -06:00
parent 268ca229a2
commit 3ffe07572b

61
main.py
View File

@@ -60,35 +60,23 @@ def get_everything(manifest_path, early_cutoff):
#print(vcs_path) return #print(vcs_path) return
try: try:
repo_path = vcs_path[0] repo_path = vcs_path[0]
largest_object[repo_path] = {}
largest_object[repo_path]["perceval_obj"] = pt.main(vcs_path, early_cutoff)
if len(largest_object[repo_path]["perceval_obj"]) == 0:
print("PERCEVAL ERROR")
del largest_object[repo_path]
return
largest_object[repo_path]["gha_obj"] = gha.main(vcs_path, early_cutoff)
'''
if largest_object[repo_path]["gha_obj"]['milestone_count'] == 0:
#del largest_object[repo_path]
#return
#this is to ensure that projects which don't use milestones are counted
largest_object[repo_path]["gha_obj"]['milestone_count'] = 0.1
largest_object[repo_path]['new_mmt'] = compute_new_mmt(largest_object[repo_path]["perceval_obj"]['contributors'], largest_object[repo_path]["perceval_obj"]['collaborators'])
#print('New MMT: ' + str(largest_object[repo_path]['new_mmt']))
largest_object[repo_path]['old_mmt'] = compute_old_mmt(largest_object[repo_path]["perceval_obj"]['contributors'], largest_object[repo_path]["perceval_obj"]['collaborators'])
#print('Old MMT: ' + str(largest_object[repo_path]['old_mmt']))
#new mmt formality score
largest_object[repo_path]['new_formality'] = compute_formality_score(largest_object[repo_path]['new_mmt'], largest_object[repo_path]["gha_obj"]['milestone_count'], largest_object[repo_path]["perceval_obj"]['age_of_project'])
print(largest_object[repo_path]['new_formality'])
'''
# testing out beneath:
largest_object[repo_path]['ghs_obj'] = ghs.main(vcs_path, early_cutoff)
#print(ghs_obj["time_cleaned_comm"])
repo_uri_list = repo_path.split('/')
with open('/data/users/mgaughan/kkex_data_110823_1/' + repo_uri_list[-2] + '_' + repo_uri_list[-1] + '_result.json', 'w') as data_path:
json.dump(largest_object[repo_path], data_path)
except: except:
print("miscellanea error in the main body") print('vcs error')
return
largest_object[repo_path] = {}
largest_object[repo_path]["perceval_obj"] = pt.main(vcs_path, early_cutoff)
if len(largest_object[repo_path]["perceval_obj"]) == 0:
print("PERCEVAL ERROR")
del largest_object[repo_path]
return
largest_object[repo_path]["gha_obj"] = gha.main(vcs_path, early_cutoff)
# testing out beneath:
largest_object[repo_path]['ghs_obj'] = ghs.main(vcs_path, early_cutoff)
#print(ghs_obj["time_cleaned_comm"])
repo_uri_list = repo_path.split('/')
with open('/data/users/mgaughan/kkex_data_110823_1/' + repo_uri_list[-2] + '_' + repo_uri_list[-1] + '_result.json', 'w') as data_path:
json.dump(largest_object[repo_path], data_path)
except yaml.YAMLError as err: except yaml.YAMLError as err:
print(err) print(err)
print("----------------------") print("----------------------")
@@ -108,3 +96,20 @@ def compute_formality_score(mmt, milestones, lifetime):
if __name__ == "__main__": if __name__ == "__main__":
main() main()
'''
if largest_object[repo_path]["gha_obj"]['milestone_count'] == 0:
#del largest_object[repo_path]
#return
#this is to ensure that projects which don't use milestones are counted
largest_object[repo_path]["gha_obj"]['milestone_count'] = 0.1
largest_object[repo_path]['new_mmt'] = compute_new_mmt(largest_object[repo_path]["perceval_obj"]['contributors'], largest_object[repo_path]["perceval_obj"]['collaborators'])
#print('New MMT: ' + str(largest_object[repo_path]['new_mmt']))
largest_object[repo_path]['old_mmt'] = compute_old_mmt(largest_object[repo_path]["perceval_obj"]['contributors'], largest_object[repo_path]["perceval_obj"]['collaborators'])
#print('Old MMT: ' + str(largest_object[repo_path]['old_mmt']))
#new mmt formality score
largest_object[repo_path]['new_formality'] = compute_formality_score(largest_object[repo_path]['new_mmt'], largest_object[repo_path]["gha_obj"]['milestone_count'], largest_object[repo_path]["perceval_obj"]['age_of_project'])
print(largest_object[repo_path]['new_formality'])
'''