2023-11-09 16:45:16 +00:00
|
|
|
import json
|
|
|
|
import os
|
|
|
|
import csv
|
2023-11-10 05:18:34 +00:00
|
|
|
import pandas
|
2023-11-09 16:45:16 +00:00
|
|
|
|
2023-11-10 05:18:34 +00:00
|
|
|
#directory = '/data/users/mgaughan/kkex_data_110823_3/'
|
2023-11-09 16:45:16 +00:00
|
|
|
|
2023-11-10 05:18:34 +00:00
|
|
|
# Input and output locations for the merge step.
path_to_file = 'power_data_110923_mmt.csv'
PACKAGE_RESULTS_PATH = '/data_ext/users/kcz1100/kaylea_dissertation/collabnetXS/raw_data/inst_all_packages_full_results.csv'
OUTPUT_PATH = 'power_data_111023_mmt_ufm.csv'


def project_name_from_repo(repo):
    """Return the package name embedded in a ``repo`` value.

    The last 12 characters of ``repo`` are dropped (presumably a fixed
    file-name suffix -- TODO confirm against the data), the remainder is
    split on ``_`` and the second field is taken. A trailing ``.git`` is
    removed from that field.

    Args:
        repo: The string stored in the ``repo`` column.

    Returns:
        The extracted project name.

    Raises:
        IndexError: If the trimmed value contains no ``_`` separator.
    """
    name = repo[:-12].split('_')[1]
    # Only strip a real ".git" suffix; a plain substring test would also
    # truncate names such as "my.github.io".
    if name.endswith('.git'):
        name = name[:-4]
    return name


def add_up_fac_mean(power_data, package_results):
    """Return a copy of ``power_data`` with an ``up.fac.mean`` column added.

    Each row's project name is derived from its ``repo`` value and looked up
    in the ``pkg`` column of ``package_results``.

    Args:
        power_data: DataFrame with a ``repo`` column.
        package_results: DataFrame with ``pkg`` and ``up.fac.mean`` columns.

    Returns:
        A new DataFrame; ``up.fac.mean`` holds one scalar per row and is NaN
        where no package matches. If a package is listed more than once, its
        first occurrence is used.
    """
    project_names = power_data['repo'].map(project_name_from_repo)
    # Series.map needs a uniquely indexed lookup, so keep the first row
    # for every package name.
    lookup = (
        package_results.drop_duplicates(subset='pkg')
        .set_index('pkg')['up.fac.mean']
    )
    merged = power_data.copy()
    merged['up.fac.mean'] = project_names.map(lookup)
    return merged


def main():
    """Load both CSV files, attach ``up.fac.mean`` and write the result."""
    csv_1 = pandas.read_csv(path_to_file)
    print(csv_1)
    csv_2 = pandas.read_csv(PACKAGE_RESULTS_PATH)
    print(csv_2['pkg'])
    csv_1 = add_up_fac_mean(csv_1, csv_2)
    print(csv_1)
    csv_1.to_csv(OUTPUT_PATH)


if __name__ == "__main__":
    main()
|
|
|
|
|
|
|
|
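# Disabled code: the string literal below is never executed. It wrote
# power_data_110923.csv from the JSON files in `directory`; the `directory`
# assignment near the top of the file is commented out and must be restored
# before re-enabling it.
'''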
|
2023-11-09 16:45:16 +00:00
|
|
|
with open('/data/users/mgaughan/power_data_110923.csv', "w") as csv_file:
|
|
|
|
csv_header = ['repo', 'age', 'contributors', 'collaborators', 'milestones']
|
|
|
|
writer = csv.writer(csv_file, delimiter=',')
|
|
|
|
writer.writerow(csv_header)
|
|
|
|
for filename in os.listdir(directory):
|
|
|
|
new_row = []
|
|
|
|
f = os.path.join(directory, filename)
|
|
|
|
if os.path.isfile(f):
|
|
|
|
print(f)
|
|
|
|
new_row.append(f.split("/")[-1])
|
|
|
|
open_f = open(f)
|
|
|
|
data = json.load(open_f)
|
|
|
|
new_row.append(data['perceval_obj']['age_of_project'])
|
|
|
|
new_row.append(data['perceval_obj']['contributors'])
|
|
|
|
new_row.append(data['perceval_obj']['collaborators'])
|
|
|
|
new_row.append(data['gha_obj']['milestone_count'])
|
2023-11-10 05:18:34 +00:00
|
|
|
writer.writerow(new_row)
|
|
|
|
'''
|