updating pr_data again

This commit is contained in:
Matthew Gaughan 2024-03-14 08:31:11 -05:00
parent 954486d5c2
commit d8433ae18d

View File

@ -15,7 +15,7 @@ early_cutoff = dt.datetime(2008,2, 8)
temp_dir = "/data/users/mgaughan/tmp"
'''
- rate of change, rate of PRs/day
- rate of change, rate of all/day
'''
def file_get_pr(upstream_vcs_link, me_read):
# me_read is true when we're looking at README files and false when we're looking at CONTRIBUTING files
@ -76,7 +76,7 @@ def file_get_pr(upstream_vcs_link, me_read):
project_dict['first_readme'] = first_date_readme
before_read = pr_count(first_date_readme+ dt.timedelta(days=-window, hours=0), first_date_readme, commit_list, [], [])
if before_read != None:
project_dict['before_prs_read'] = before_read[0]
project_dict['before_allcom_read'] = before_read[0]
project_dict['before_mrg_read'] = before_read[1]
project_dict['before_auth_new'] = before_read[2]
project_dict['before_commit_new'] = before_read[3]
@ -84,7 +84,7 @@ def file_get_pr(upstream_vcs_link, me_read):
return {}
after_read = pr_count(first_date_readme, first_date_readme + dt.timedelta(days=window, hours=0), commit_list, before_read[4], before_read[5])
if after_read != None:
project_dict['after_prs_read'] = after_read[0]
project_dict['after_allcom_read'] = after_read[0]
project_dict['after_mrg_read'] = after_read[1]
project_dict['after_auth_new'] = after_read[2]
project_dict['after_commit_new'] = after_read[3]
@ -94,7 +94,7 @@ def file_get_pr(upstream_vcs_link, me_read):
project_dict['first_contributing'] = first_date_contributing
before_cont = pr_count(first_date_contributing + dt.timedelta(days=-window, hours=0), first_date_contributing, commit_list, [], [])
if before_cont != None:
project_dict['before_prs_cont'] = before_cont[0]
project_dict['before_allcom_cont'] = before_cont[0]
project_dict['before_mrg_cont'] = before_cont[1]
project_dict['before_auth_new'] = before_cont[2]
project_dict['before_commit_new'] = before_cont[3]
@ -102,7 +102,7 @@ def file_get_pr(upstream_vcs_link, me_read):
return {}
after_cont = pr_count(first_date_contributing, first_date_contributing + dt.timedelta(days=window, hours=0), commit_list, before_cont[4], before_cont[5])
if after_cont != None:
project_dict['after_prs_cont'] = after_cont[0]
project_dict['after_allcom_cont'] = after_cont[0]
project_dict['after_mrg_cont'] = after_cont[1]
project_dict['after_auth_new'] = after_cont[2]
project_dict['after_commit_new'] = after_cont[3]
@ -150,7 +150,7 @@ def for_files():
csv_reader = csv.DictReader(file)
with open('kk_test_031424_pr_did.csv', "w") as writing_file:
# this would also have to get switched for the cont dataset
keys = ['upstream_vcs_link', "first_readme", "before_prs_read", "before_mrg_read", "after_prs_read", "after_mrg_read", 'before_auth_new', 'after_commit_new', 'after_auth_new', 'before_commit_new']
keys = ['upstream_vcs_link', "first_readme", "before_allcom_read", "before_mrg_read", "after_allcom_read", "after_mrg_read", 'before_auth_new', 'after_commit_new', 'after_auth_new', 'before_commit_new']
dict_writer = csv.DictWriter(writing_file, keys)
dict_writer.writeheader()
for row in csv_reader: