macey
By: a guest | Feb 9th, 2010 | Syntax:
Python | Size: 1.13 KB | Hits: 16 | Expires: Never
def sortData(fileName):
    """Read ``fileName + '.txt'`` and tally the integers found on each line.

    Every line of the file is split on whitespace and each token is parsed
    with ``int``. The line becomes one row of 20 counters in which
    ``row[k]`` is the number of times the value ``k`` occurred on that line.
    A blank line yields a row of zeros.

    Args:
        fileName: Path of the data file without its ``.txt`` extension.

    Returns:
        A list containing one 20-element list of counts per line, in file
        order.

    Raises:
        IOError / OSError: If the file cannot be opened.
        ValueError: If a token is not an integer literal.
        IndexError: If a parsed value lies outside -20..19 (negative values
            index from the end of the row, as plain list indexing does).
    """
    rows = []
    # The context manager closes the file even if parsing raises part-way.
    with open(fileName + '.txt') as rawData:
        for line in rawData:
            # A fresh list per line keeps rows independent; a literal list
            # (rather than range(20)) is assignable on Python 2 and 3 alike.
            counts = [0] * 20
            for token in line.split():
                counts[int(token)] += 1
            rows.append(counts)
    return rows
#print sortData("U2Fans")
def toBernoulli(data):
    """Convert a sequence of values into 0/1 indicators.

    Args:
        data: Iterable of values (for example one row of counts).

    Returns:
        A new list, in input order, holding ``0`` where the element equals
        0 and ``1`` everywhere else. The input is not modified.
    """
    # A comprehension only needs iteration, so tuples and generators are
    # accepted as well as lists; no index bookkeeping is required.
    return [0 if value == 0 else 1 for value in data]
# NOTE: fanData will come from the list returned by sortData("AllListeners").
def probVector(sortedData):
    """Return, for each of the 20 slots, the fraction of rows that are non-zero there.

    Args:
        sortedData: Sized collection of rows, each holding at least 20
            values (the shape produced by ``sortData``).

    Returns:
        A list of 20 floats. Element ``j`` is the number of rows whose
        ``j``-th value is non-zero divided by the number of rows. Every
        element is ``0.0`` when ``sortedData`` is empty.

    Raises:
        IndexError: If a row has fewer than 20 entries.
    """
    total = float(len(sortedData))
    if not total:
        # No rows at all: nothing to divide by, so every fraction is 0.0.
        return [0.0] * 20

    hits = [0] * 20
    for row in sortedData:
        for j in range(20):
            if row[j] != 0:
                hits[j] += 1

    # Divide each integer count once. Adding 1/total per row instead lets
    # rounding error pile up (ten non-zero rows would sum to
    # 0.9999999999999999 rather than 1.0).
    return [count / total for count in hits]
#for u in sortData("U2Fans"):
# print toBernoulli(u)
# Print the probability vector computed from the "U2Fans" data file.
# Written as a call so the line parses on Python 3 as well as Python 2
# (with a single argument the output is the same on both).
print(probVector(sortData("U2Fans")))
def fanType(fanData):
    """Load the three fan data sets and reduce them, and ``fanData``, to 0/1 vectors.

    NOTE(review): the function stops after these conversions. It does not
    compare ``fanData`` with the data sets and returns ``None``, so it
    appears to be unfinished; the converted values are currently unused.

    Args:
        fanData: One row of counts for the listener being examined.

    Returns:
        None.
    """
    # Each row is converted from its own entry. The earlier index loops
    # read b[i] with the index left over from the previous loop, which
    # copied a single row into every position (or raised IndexError).
    u2Fans = [toBernoulli(row) for row in sortData("U2Fans")]
    coldplayFans = [toBernoulli(row) for row in sortData("ColdplayFans")]
    girlsAloudFans = [toBernoulli(row) for row in sortData("GirlsAloudFans")]
    fanData = toBernoulli(fanData)