From a8d3e820a994b69951c008f0c2ad469bd8b8183a Mon Sep 17 00:00:00 2001 From: arukavytsia Date: Sun, 13 Aug 2017 04:45:19 +0300 Subject: [PATCH] Fill readme --- README.md | 13 +++++++++++++ src/main/scala/graphx/GraphX.scala | 2 +- 2 files changed, 14 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 5def09c..4a378df 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,15 @@ # spark-graphx Spark 2.0 GraphX Social graph analysis + +Example of using Apache Spark to analyze a social graph of users - +similar to a social network with a friend-to-friend model, but with fake user names. + +The social graph is represented in the form user_id -> array of related users' ids; +the file is stored in the resources directory - UserGraph.txt + +Test data is stored in the resources directory - UserNames.tsv - a file in the +format user_id -> user_name, necessary for joining with the graph of contacts. + +The examples cover searching for: + 1) The most connected user in the social graph, based on graph degrees + 2) The degree of separation for a single user, based on [Breadth-first search](https://en.wikipedia.org/wiki/Breadth-first_search) with [Pregel](https://stanford.edu/~rezab/classes/cme323/S15/notes/lec8.pdf) diff --git a/src/main/scala/graphx/GraphX.scala b/src/main/scala/graphx/GraphX.scala index 4edea94..fcabe53 100644 --- a/src/main/scala/graphx/GraphX.scala +++ b/src/main/scala/graphx/GraphX.scala @@ -39,7 +39,7 @@ class GraphX(sc: SparkContext) { private def graph = Graph(verts, edges).cache() /** - * Find most connected user grpah.degrees + * Find most connected user graph.degrees * @param amount threshold for returning first n user * @return most connected user in social graph */