"A" "B" "C" "D" "E" "F" "G" 'G' 'A' 'A' 'G' 'B' 'A' 'C' 'A' 'A' 'C' 'A' 'D' 'E' 'A' 'F' 'A' 'B' 'D' 'D' 'F' "Red"

In
[2]: import matplotlib.pyplot as plt
import networkx as nx
import pandas as pd
import scipy as scipy
In [3]: G = nx.DiGraph()
[G.add_node(k) for k in ["A", "B", "C", "D", "E", "F", "G"]]
G.add_edges_from([('G','A'), ('A','G'),('B','A'),
('C','A'),('A','C'),('A','D'),
('E','A'),('F','A'),('B','D'),
('D','F')])
pos = nx.spiral_layout(G)
nx.draw(G, pos, with_labels = True, node_color="red")
In [4]: pr1 = nx.pagerank(G)
print(pr1)
nx.draw(G, pos, nodelist=list(pr1.keys()), node_size=[round(v * 4000) for v in pr1.value

with_labels = True, node_color="red")
{'A': 0.40001520046189115, 'B': 0.021428571428571432, 'C': 0.1347663991011727, 'D': 0.14

387354195831553, 'E': 0.021428571428571432, 'F': 0.1437213165203047, 'G': 0.134766399101
1727}
Loading [MathJax]/jax/output/CommonHTML/fonts/TeX/fontdata.js
In [5]: pr_09 = nx.pagerank(G, alpha=0.9)
pr_08 = nx.pagerank(G, alpha=0.8)
res = pd.DataFrame({"alpha=0.9": pr_09, "alpha=0.8": pr_08})
res
Out[5]: alpha=0.9 alpha=0.8
A 0.409777 0.389972
B 0.014286 0.028571
C 0.137218 0.132564
D 0.143647 0.143993
E 0.014286 0.028571
F 0.143568 0.143765
G 0.137218 0.132564
In [6]: pr_e = nx.pagerank(G, alpha=0.9, personalization={'E': 1})
print(pr_e)
nx.draw(G, pos, nodelist=list(pr_e.keys()), node_size=[round(v * 4000) for v in pr_e.val

with_labels = True, node_color="red")
{'A': 0.4147475495142858, 'B': 0.0, 'C': 0.12442358835485172, 'D': 0.12442358835485172,

'E': 0.09999999999999998, 'F': 0.11198168542115904, 'G': 0.12442358835485172}
In [8]: import urllib.request
import shutil
import zipfile
import os
filename='ml-100k'
data_url='https://files.grouplens.org/datasets/movielens/ml-100k.zip'
with urllib.request.urlopen(data_url) as response, open('./'+filename, 'wb') as out_file

shutil.copyfileobj(response, out_file)
print('Download completed')
with zipfile.ZipFile('./'+filename, 'r') as zip_ref:
zip_ref.extractall('./sample_data/')
dirs = [x[0] for x in os.walk("./sample_data")]
ml = filter(lambda dirName: dirName if ('ml' in dirName) else '', list(dirs))
dt_dir_name= list(ml)[0]
rdata = pd.read_csv(dt_dir_name +'/'+ 'u.data', delimiter='\t', names=['userId', 'movieI

rdata['userId'] = 'u' + rdata['userId'].astype(str)
rdata['movieId'] = 'i' + rdata['movieId'].astype(str)
usrdata = pd.read_csv(dt_dir_name +'/'+'u.user', delimiter='|', names=['user id', 'age'

item_data = pd.read_csv(dt_dir_name +'/'+ 'u.item', delimiter='|', encoding="ISO-8859-1"
item_data = item_data[[0,1]]
item_data.columns = ['movieId','movieTitle']
item_data['movieId'] = 'i' + item_data['movieId'].astype(str)
item_data = item_data.set_index('movieId')
rdata.head()
Download completed
Out[8]: userId movieId rating timestamp
0 u196 i242 3 881250949
1 u186 i302 3 891717742
2 u22 i377 1 878887116
3 u244 i51 2 880606923
4 u166 i346 1 886397596
In [10]: rdata = pd.merge(rdata, item_data, how='left', on='movieId')
rdata.head()
Out[10]: userId movieId rating timestamp movieTitle_x movieTitle_y
0 u196 i242 3 881250949 Kolya (1996) Kolya (1996)
1 u186 i302 3 891717742 L.A. Confidential (1997) L.A. Confidential (1997)
2 u22 i377 1 878887116 Heavyweights (1994) Heavyweights (1994)
3 u244 i51 2 880606923 Legends of the Fall (1994) Legends of the Fall (1994)
4 u166 i346 1 886397596 Jackie Brown (1997) Jackie Brown (1997)
In [11]: #Create a graph
G = nx.Graph()
#Add nodes
G.add_nodes_from(rdata.userId, bipartite=0)
G.add_nodes_from(rdata.movieId, bipartite=1)
#Add weights for edges
G.add_weighted_edges_from([(uId, mId,rating) for (uId, mId, rating)
in rdata[['userId', 'movieId', 'rating']].to_numpy()])
print(nx.info(G))
print(nx.is_bipartite(G))
Graph with 2625 nodes and 100000 edges
True
C:\Users\Vainavi\AppData\Local\Temp\ipykernel_2460\255363031.py:9: DeprecationWarning: i
nfo is deprecated and will be removed in version 3.0.
print(nx.info(G))
In [12]: movie_rank = nx.pagerank(G, alpha=0.85)
In [13]: def return_top_movies(movie_rank):
movie_rank = dict(sorted(movie_rank.items(), key=lambda item: item[1], reverse=True))
top_10_movies = []
for key, value in movie_rank.items():
if 'i' in key:
top_10_movies.append(key)
if len(top_10_movies) == 10:
break
return item_data.loc[top_10_movies]
In [14]: return_top_movies(movie_rank)
Out[14]: movieTitle
movieId
i50 Star Wars (1977)
i258 Contact (1997)
i100 Fargo (1996)
i181 Return of the Jedi (1983)
i286 English Patient, The (1996)
i288 Scream (1996)
i300 Air Force One (1997)
i127 Godfather, The (1972)
i1 Toy Story (1995)
i313 Titanic (1997)
In [15]: user_query = 'u196'
recommendation = nx.pagerank(G, alpha=0.85, personalization={user_query:1})
return_top_movies(recommendation)
Out[15]: movieTitle
movieId
i286 English Patient, The (1996)
i153 Fish Called Wanda, A (1988)
i8 Babe (1995)
i655 Stand by Me (1986)
i285 Secrets & Lies (1996)
i692 American President, The (1995)
i663 Being There (1979)
i67 Ace Ventura: Pet Detective (1994)
i25 Birdcage, The (1996)
i238 Raising Arizona (1987)
In [ ]:

"A" "B" "C" "D" "E" "F" "G" 'G' 'A' 'A' 'G' 'B' 'A' 'C' 'A' 'A' 'C' 'A' 'D' 'E' 'A' 'F' 'A' 'B' 'D' 'D' 'F' "Red"

Uploaded by

Document Information

Original Description:

Original Title

Copyright

Available Formats

Share this document

Share or Embed Document

Sharing Options

Did you find this document useful?

Is this content inappropriate?

Copyright:

Available Formats

"A" "B" "C" "D" "E" "F" "G" 'G' 'A' 'A' 'G' 'B' 'A' 'C' 'A' 'A' 'C' 'A' 'D' 'E' 'A' 'F' 'A' 'B' 'D' 'D' 'F' "Red"

Uploaded by

Copyright:

Available Formats

In

[2]: import matplotlib.pyplot as plt

import scipy as scipy

[G.add_node(k) for k in ["A", "B", "C", "D", "E", "F", "G"]]

nx.draw(G, pos, with_labels = True, node_color="red")

In [4]: pr1 = nx.pagerank(G)

nx.draw(G, pos, nodelist=list(pr1.keys()), node_size=[round(v * 4000) for v in pr1.value

{'A': 0.40001520046189115, 'B': 0.021428571428571432, 'C': 0.1347663991011727, 'D': 0.14

pr_08 = nx.pagerank(G, alpha=0.8)

res = pd.DataFrame({"alpha=0.9": pr_09, "alpha=0.8": pr_08})

Out[5]: alpha=0.9 alpha=0.8

In [6]: pr_e = nx.pagerank(G, alpha=0.9, personalization={'E': 1})

nx.draw(G, pos, nodelist=list(pr_e.keys()), node_size=[round(v * 4000) for v in pr_e.val

{'A': 0.4147475495142858, 'B': 0.0, 'C': 0.12442358835485172, 'D': 0.12442358835485172,

with urllib.request.urlopen(data_url) as response, open('./'+filename, 'wb') as out_file

with zipfile.ZipFile('./'+filename, 'r') as zip_ref:

ml = filter(lambda dirName: dirName if ('ml' in dirName) else '', list(dirs))

rdata = pd.read_csv(dt_dir_name +'/'+ 'u.data', delimiter='\t', names=['userId', 'movieI

rdata['movieId'] = 'i' + rdata['movieId'].astype(str)

usrdata = pd.read_csv(dt_dir_name +'/'+'u.user', delimiter='|', names=['user id', 'age'

item_data['movieId'] = 'i' + item_data['movieId'].astype(str)

0 u196 i242 3 881250949

1 u186 i302 3 891717742

2 u22 i377 1 878887116

3 u244 i51 2 880606923

4 u166 i346 1 886397596

In [10]: rdata = pd.merge(rdata, item_data, how='left', on='movieId')

Out[10]: userId movieId rating timestamp movieTitle_x movieTitle_y

0 u196 i242 3 881250949 Kolya (1996) Kolya (1996)

1 u186 i302 3 891717742 L.A. Confidential (1997) L.A. Confidential (1997)

2 u22 i377 1 878887116 Heavyweights (1994) Heavyweights (1994)

4 u166 i346 1 886397596 Jackie Brown (1997) Jackie Brown (1997)

In [11]: #Create a graph

#Add weights for edges

G.add_weighted_edges_from([(uId, mId,rating) for (uId, mId, rating)

in rdata[['userId', 'movieId', 'rating']].to_numpy()])

Graph with 2625 nodes and 100000 edges

In [12]: movie_rank = nx.pagerank(G, alpha=0.85)

In [13]: def return_top_movies(movie_rank):

movie_rank = dict(sorted(movie_rank.items(), key=lambda item: item[1], reverse=True))

for key, value in movie_rank.items():

i50 Star Wars (1977)

i258 Contact (1997)

i100 Fargo (1996)

i181 Return of the Jedi (1983)

i286 English Patient, The (1996)

i288 Scream (1996)

i300 Air Force One (1997)

i127 Godfather, The (1972)

i1 Toy Story (1995)

i313 Titanic (1997)

In [15]: user_query = 'u196'

recommendation = nx.pagerank(G, alpha=0.85, personalization={user_query:1})

i286 English Patient, The (1996)

i153 Fish Called Wanda, A (1988)

i655 Stand by Me (1986)

i285 Secrets & Lies (1996)

i692 American President, The (1995)

i663 Being There (1979)

i67 Ace Ventura: Pet Detective (1994)

i25 Birdcage, The (1996)

i238 Raising Arizona (1987)