# Professional Documents
# Culture Documents
# Load vertex and edge lists from CSV, build a GraphFrame from them, and run a
# series of exploratory graph queries (degrees, grouping, motif search, label
# propagation, PageRank).
#
# Expects to run in a PySpark shell/session that already provides `sqlContext`
# and has the spark-csv and graphframes packages available.
from graphframes import GraphFrame

# The reader chains are parenthesised so they can legally span several lines
# (a bare `vertices =` followed by a newline is a syntax error).
vertices = (
    sqlContext.read.format("com.databricks.spark.csv")
    .options(header='true', inferschema='true')
    .load("file:///home/cloudera/Downloads/vertices_file.csv")
)
edges = (
    sqlContext.read.format("com.databricks.spark.csv")
    .options(header='true', inferschema='true')
    .load("file:///home/cloudera/Downloads/edges_file.csv")
)

# Expose both DataFrames to SQL queries under the names "edges" / "vertices".
edges.registerTempTable("edges")
vertices.registerTempTable("vertices")

# Build the graph that every query below operates on.
# NOTE(review): GraphFrame requires an `id` column in the vertex DataFrame and
# `src`/`dst` columns in the edge DataFrame; the CSV headers are assumed to
# provide them -- confirm against the input files.
g = GraphFrame(vertices, edges)

# Raw graph contents.
g.vertices.show()
g.edges.show()

# Per-vertex degree summaries.
g.inDegrees.show()
g.outDegrees.show()
g.degrees.show()

# Number of vertices per distinct value of the "Experience" column.
exp = g.vertices.groupBy("Experience")
exp.count().show()

# Motif search: every directed edge e from a vertex a to a vertex b.
motifs = g.find("(a)-[e]->(b)")
# count() returns a plain integer, which has no .show(); print it instead.
print(motifs.count())

# Community detection via label propagation, capped at 5 iterations.
result = g.labelPropagation(maxIter=5)
result.show()

# PageRank run until the given tolerance is reached.
results = g.pageRank(resetProbability=0.15, tol=0.01)
results.vertices.show()
results.edges.show()

# PageRank with a fixed number of iterations; show the 10 top-ranked vertices.
# The result is bound to `ranks`, the name the following line reads.
ranks = g.pageRank(resetProbability=0.15, maxIter=5)
ranks.vertices.orderBy(ranks.vertices.pagerank.desc()).limit(10).show()