Professional Documents
Culture Documents
Implementation of Page Rank
Implementation of Page Rank
import networkx as nx
# Create an empty directed graph, then draw it with node labels and show the
# figure.
# NOTE(review): indentation was lost in this extract and the body of the
# `for` loop below is not visible; `n` is not defined in the visible lines,
# and `plt` is used although only `networkx` is imported here. No PageRank
# computation is visible either — TODO restore the missing lines from the
# original program.
D = nx.DiGraph()
for i in range(n):
# NOTE(review): presumably nodes/edges were added to D inside the loop above
# — confirm against the original.
nx.draw(D, with_labels=True)
plt.show()
Implementation of Association Rule Mining (e.g., the Apriori algorithm) in a language such as Java or Python.
Code:
# Build the transaction table, collect every item into one sorted list, and
# derive the support threshold.
# NOTE(review): indentation was lost in this extract, so the nesting shown
# here is not valid Python; `n` and `sp` are not defined in the visible lines.
#
# Each entry of `data` is [transaction index, list of items].
data = []
for i in range(n):
# NOTE(review): `arr` is appended while still empty in the visible lines —
# the statements that fill it appear to be missing; TODO confirm.
arr = []
data.append([i, arr])
# Flatten the item lists of all transactions into `init`.
# NOTE(review): no de-duplication is visible, so an item that occurs in
# several transactions would appear several times in `init` — confirm.
init = []
for i in data:
for q in i[1]:
init.append(q)
init = sorted(init)
print(init)
# Threshold: the ratio `sp` scaled by the length of `init`, truncated to int.
s = int(sp*len(init))
# Level 1 of Apriori: count single items (C1), re-key them as one-element
# frozensets (L1), and print both tables.
# NOTE(review): indentation was lost in this extract; `Counter` is used but
# no import is visible (presumably `collections.Counter` — confirm).
c = Counter()
# For every entry of `init`, add one for each transaction whose item list
# contains it.
# NOTE(review): if `init` holds repeated items, the same key is incremented
# again on each repeat — verify against the original.
for i in init:
for d in data:
if(i in d[1]):
c[i]+=1
print("\nC1:")
for i in c:
print(str([i])+": "+str(c[i]))
print()
# Copy the C1 counts into `l`, keyed by frozenset so itemsets can be unioned
# and used as dictionary keys later.
# NOTE(review): no comparison against the threshold `s` is visible here, so
# every C1 entry is carried into L1 — a minimum-support filter seems to be
# missing; TODO confirm.
l = Counter()
for i in c:
l[frozenset([i])]+=c[i]
print("L1:")
for i in l:
print(str(list(i))+": "+str(l[i]))
print()
# Remember the most recent level table and its level number for the final
# "Result" printout.
pl = l
pos = 1
# Levels 2..999 of Apriori: build candidate itemsets of size `count` from the
# previous level, count the transactions containing each one, print the
# C/L tables, and finally print the last recorded level as the result.
# NOTE(review): indentation was lost in this extract, so where the loop body
# ends (and whether `pl`/`pos` are updated inside it) cannot be read from
# these lines — confirm against the original.
for count in range (2,1000):
# Stop when the previous level holds exactly one itemset.
# NOTE(review): an empty `l` does not satisfy this test, so in that case the
# loop would apparently keep running up to count 999 — verify.
if(len(l) == 1):
break
# Candidate generation: union every pair of previous-level itemsets and keep
# the unions that have exactly `count` items (the set removes duplicates).
nc = set()
temp = list(l)
for i in range(0,len(temp)):
for j in range(i+1,len(temp)):
t = temp[i].union(temp[j])
if(len(t) == count):
nc.add(temp[i].union(temp[j]))
nc = list(nc)
# Support counting: for each candidate, count the transactions whose item
# set contains it. `temp` is reused here for the transaction's item set.
c = Counter()
for i in nc:
c[i] = 0
for q in data:
temp = set(q[1])
if(i.issubset(temp)):
c[i]+=1
print("C"+str(count)+":")
for i in c:
print(str(list(i))+": "+str(c[i]))
print()
# Copy the candidate counts into the new level table.
# NOTE(review): no comparison against the threshold `s` is visible, so every
# candidate is kept — a minimum-support filter seems to be missing; confirm.
l = Counter()
for i in c:
l[i]+=c[i]
print("L"+str(count)+":")
for i in l:
print(str(list(i))+": "+str(l[i]))
print()
# Record this level as the latest one.
pl = l
pos = count
# Final report: the last recorded level table and its level number.
print("Result: ")
print("L"+str(pos)+":")
for i in pl:
print(str(list(i))+": "+str(pl[i]))
print()
Code -
# Equal-frequency binning with smoothing by mean, median and boundaries.
# NOTE(review): this extract is heavily truncated and its indentation is
# lost. No `def equifreq(...)` line is visible although `equifreq(data, m)`
# is called at the end, and `arr1`, `mean`, `b1`, `b2` and `b3` are not
# defined in the visible lines — TODO restore from the original program.
#
# `a` is the number of values; `n` is `a / m` truncated to int.
a = len(arr1)
n = int(a / m)
arr = []
# NOTE(review): the loop this `if`/`break` belongs to is not visible.
if j >= a:
break
k = int(i/3)
for j in range(3):
b1[k][j] = int(mean)
print("Smoothing by Mean:")
for i in range(3):
# With `i` taken from range(3), int(i/3) is 0 on every iteration shown.
k = int(i/3)
for j in range(3):
b2[k][j] = arr1[i+1]
print("Smoothing by Median:")
for i in range(3):
k = int(i/3)
for j in range(3):
b3[k][j] = arr1[i]
# NOTE(review): the `if` that this `else` pairs with is not visible.
else:
b3[k][j] = arr1[i+2]
print("Smoothing by Boundaries:")
# NOTE(review): the body of the loop below is not visible.
for i in range(3):
# Number of bins
m=3
print("Bins: ")
equifreq(data, m)
B] Data Visualization
import pandas as pd
# Load the data set from a CSV file given by relative path.
# NOTE(review): `plt` is used below but no import for it is visible in this
# extract — confirm it is imported in the full program.
data = pd.read_csv("dwm_exp8.csv")

# Scatter plot of the 'tip' column against the 'day' column.
plt.scatter(x=data['day'], y=data['tip'])
plt.xlabel('Day')
plt.ylabel('Tip')
plt.title("Scatter Plot")
plt.show()

# Histogram of the 'total_bill' column.
plt.hist(x=data['total_bill'])
plt.title("Histogram")
plt.show()
Implementation of the K-Means Clustering Algorithm
Code -
import sys
import random
# K-Means style loop: pick `k` starting means at random from the data, then
# for up to 5 rounds assign every value to a cluster, recompute each mean,
# and stop early once the means no longer change.
# NOTE(review): indentation was lost in this extract and several lines are
# missing; `obj` and `k` are not defined in the visible lines.
#
# NOTE(review): `obj.split()` with no conversion visible — if `obj` is a
# string the elements are strings, yet they are added to a number below;
# presumably a numeric conversion is missing. TODO confirm.
dataset = obj.split()
# Maps cluster index -> list of values assigned to that cluster.
Dict = {}
meansOld = random.sample(dataset, k)
means = meansOld.copy()
for x in range(5):
# Start every round with empty clusters.
for i in range(k):
Dict[i] = []
for i in range(len(dataset)):
minIndex = 0
minValue = sys.maxsize
# NOTE(review): no distance computation or comparison against `minValue` is
# visible inside this loop, so as shown `minIndex` just takes each `j` in
# turn — the selection logic appears to be missing.
for j in range(len(means)):
minIndex = j
Dict[minIndex].append(dataset[i])
# Recompute a cluster mean as sum / count of its members.
# NOTE(review): `key` and `value` are not bound in the visible lines —
# presumably a loop over the items of `Dict` is missing. `sum` also shadows
# the built-in of the same name.
sum = 0
num = 0
for i in value:
sum = sum + i
num = num + 1
means[key] = sum/num
# Stop when the means did not change in this round.
if(meansOld == means):
break
meansOld = means.copy()
Dict.clear()