Graphx
Graphx
import org.apache.spark._
import org.apache.spark.graphx._
................................................................................
Creating Vertices Table ---->
-----------------------------
scala> val vertices=Array((1L, ("A")),(2L, ("B")),(3L, ("C")))
vertices: Array[(Long, String)] = Array((1,A), (2,B), (3,C))
scala> val vRDD = sc.parallelize(vertices)
scala> vRDD.take(1)
[Stage 0:> (0 + 0) [Stage
0:> (0 + 1)
res0: Array[(Long, String)] = Array((1,A))
................................................................................
Creating Edges Table ------>
-------------------------------
scala> val edges=Array(Edge(1L,2L,1800),Edge(2L,3L,800),Edge(3L,1L,1400))
edges: Array[org.apache.spark.graphx.Edge[Int]] = Array(Edge(1,2,1800),
Edge(2,3,800), Edge(3,1,1400))
scala> val eRDD = sc.parallelize(edges)
scala> eRDD.take(2)
res1: Array[org.apache.spark.graphx.Edge[Int]] = Array(Edge(1,2,1800),
Edge(2,3,800))
..................................................................................
scala> val graph = Graph(vRDD, eRDD)
scala> graph.vertices.collect.foreach(println)
(1,A)
(2,B)
(3,C)
scala> graph.edges.collect.foreach(println)
Edge(1,2,1800)
Edge(2,3,800)
Edge(3,1,1400)
..................................................................................
scala> graph.triplets.take(3).foreach(println)
((1,A),(2,B),1800)
((2,B),(3,C),800)
((3,C),(1,A),1400)
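scala> val f = graph.inDegrees   // assumed definition (not recorded in these notes); outDegrees gives the same result on this 3-cycle
scala> f.collect()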
res6: Array[(org.apache.spark.graphx.VertexId, Int)] = Array((1,1), (2,1), (3,1))
..................................................................................
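scala> val fv = graph.outDegrees   // assumed definition (not recorded in these notes); inDegrees gives the same result on this 3-cycle
scala> fv.collect()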
res8: Array[(org.apache.spark.graphx.VertexId, Int)] = Array((1,1), (2,1), (3,1))
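scala> val totalDegrees = graph.degrees   // assumed definition (not recorded in these notes); in-degree + out-degree per vertex
scala> totalDegrees.collect()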
res9: Array[(org.apache.spark.graphx.VertexId, Int)] = Array((1,2), (2,2), (3,2))
..................................................................................
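NOTE: from here on, `graph` is a different property graph whose vertices carry (name, position) attributes and whose edges carry String labels; its vertices and edges are printed at the end of these notes.
scala> graph.vertices.filter {case (id, (name, pos)) => pos == "postdoc" }.count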
res0: Long = 1
scala> graph.edges.filter { case Edge(src, dst, prop) => src > dst }.count
res4: Long = 1
...................................................................................
...............................................
PAGE RANK ::>
scala> val rank = graph.pageRank(0.0001).vertices
rank: org.apache.spark.graphx.VertexRDD[Double] = VertexRDDImpl[106] at RDD at
VertexRDD.scala:57
scala> println(rank.collect().mkString("\n"))
(2,0.5037267911816329)
(3,0.8997819807481918)
(5,0.9318945636860209)
(7,1.6645966643841548)
scala> graph.vertices.collect.foreach(println)
(2,(istoica,prof))
(3,(rxin,student))
(5,(franklin,prof))
(7,(jgonzal,postdoc))
scala> graph.edges.collect.foreach(println)
Edge(3,7,collab)
Edge(5,3,advisor)
Edge(2,5,colleague)
Edge(5,7,pi)
...................................................................................
.................................