From bef3dfc9fc22aa735b63ecafd65cc7fca78041ba Mon Sep 17 00:00:00 2001 From: Donne Martin Date: Fri, 6 Mar 2015 07:53:17 -0500 Subject: [PATCH] Added discussion on viewing the Spark application UI. --- spark/spark.ipynb | 40 ++++++++++++++++++++++++++++++++++++++-- 1 file changed, 38 insertions(+), 2 deletions(-) diff --git a/spark/spark.ipynb b/spark/spark.ipynb index fc9f00d..1035c73 100644 --- a/spark/spark.ipynb +++ b/spark/spark.ipynb @@ -1,7 +1,7 @@ { "metadata": { "name": "", - "signature": "sha256:0426fb2480e184a6d65b40b69e4601e1abb23c84cc1090d1fe0e2e98803c6220" + "signature": "sha256:4117412dc3ddca1bb16e3800a74447569b7bd2b7484113922798e4326e254940" }, "nbformat": 3, "nbformat_minor": 0, @@ -17,7 +17,8 @@ "* Python Shell\n", "* RDDs\n", "* Pair RDDs\n", - "* Running Spark on a Cluster" + "* Running Spark on a Cluster\n", + "* Viewing the Spark Application UI" ] }, { @@ -464,6 +465,41 @@ "language": "python", "metadata": {}, "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Viewing the Spark Application UI" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Every SparkContext launches a web UI, by default on port 4040, that displays useful information about the application. This includes:\n", + "\n", + "* A list of scheduler stages and tasks\n", + "* A summary of RDD sizes and memory usage\n", + "* Environmental information\n", + "* Information about the running executors\n", + "\n", + "You can access this interface by simply opening `http://<driver-node>:4040` in a web browser. If multiple SparkContexts are running on the same host, they will bind to successive ports beginning with 4040 (4041, 4042, etc.).\n", + "\n", + "Note that this information is only available for the duration of the application by default. To view the web UI after the fact, set spark.eventLog.enabled to true before starting the application. 
This configures Spark to log Spark events that encode the information displayed in the UI to persisted storage.\n", + "\n", + "[Reference](http://spark.apache.org/docs/1.2.0/monitoring.html)" + ] + }, + { + "cell_type": "code", + "collapsed": false, + "input": [ + "http://localhost:4040/" + ], + "language": "python", + "metadata": {}, + "outputs": [] } ], "metadata": {}