-
Notifications
You must be signed in to change notification settings - Fork 0
/
Data.py
47 lines (42 loc) · 1.06 KB
/
Data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
# Precursor to FOSSE.py
import pandas as pd
def counter(x):
    """Count how many times each element occurs in ``x``.

    Args:
        x: Iterable of hashable elements.

    Returns:
        A plain dict mapping each distinct element to its number of
        occurrences, with keys in first-seen order.
    """
    sasafrass = {}
    for element in x:
        # dict.get supplies 0 for an unseen element, so no exception handling
        # is needed and unrelated errors are never silently swallowed.
        sasafrass[element] = sasafrass.get(element, 0) + 1
    return sasafrass
# Load the project table. DataFrame.to_dict() (default orient) returns
# {column: {row_index: value}}, so `ls` maps row index -> owners string.
df = pd.read_csv(r'all_eggs_data.csv')
df = df.to_dict()
ls = df["owners"]

# One owners entry per row, in row order.
owners = list(ls.values())
ownersnodups = set(owners)

# gravy maps each distinct owners string to the number of rows it appears in.
gravy = counter(owners)

# (row_count, owners_string) pairs in ascending order, so the last entry is
# the most frequent owners string (ties broken by string comparison).
users = sorted((gravy[owner], owner) for owner in gravy)

# Distinct owners strings that appear on more than one row.
notsolousers = sum(1 for count in gravy.values() if count > 1)

# Owners strings that contain several comma-separated names, split into lists.
multiman = [
    names
    for names in (owner.split(',') for owner in gravy)
    if len(names) > 1
]

# NOTE(review): an earlier version looped over `users` and `multiman` here,
# but only rebound its own loop variable and never updated `users`, so it did
# not affect the output. If the individual names inside multi-owner entries
# should be credited to single users, that has to be implemented explicitly.

print(f"Number of unique users: {len(ownersnodups)}")
print(
    "Number of users who only work on one project: "
    f"{len(ownersnodups) - notsolousers}"
)
print(f"Number of users who work more than one project: {notsolousers}")
print(f"Number of projects with more than one contributor: {len(multiman)}")

# Most frequent (count, owners) pair; skipped when the CSV has no rows.
if users:
    print(users[-1])