Spark Docker image
https://github.com/sequenceiq/docker-spark
docker run -i -t -h sandbox sequenceiq/spark /etc/bootstrap.sh -bash
cd /usr/local/spark
# run the spark shell
./bin/spark-shell --master yarn-client --driver-memory 1g --executor-memory 1g --executor-cores 1
# execute the following command, which should return 1000
scala> sc.parallelize(1 to 1000).count()