pyspark install - arcturus9/useful-link GitHub Wiki
- from Apache Spark Deep Learning Cookbook
Java 8 or higher
Anaconda
Spark
$ java -version
$ sudo apt-get install software-properties-common
$ sudo add-apt-repository ppa:webupd8team/java
$ sudo apt-get update
$ sudo apt-get install oracle-java8-installer
$ python --version
Python 3.6.1 :: Anaconda 4.4.0 (64-bit)
$ cd Downloads/
~/Downloads$ ls
spark-2.2.0-bin-hadoop2.7.tgz
~/Downloads$ tar -zxvf spark-2.2.0-bin-hadoop2.7.tgz
~/Downloads$ ls
spark-2.2.0-bin-hadoop2.7 spark-2.2.0-bin-hadoop2.7.tgz
~/Downloads$ mv spark-2.2.0-bin-hadoop2.7 ~/
~/Downloads$ ls
spark-2.2.0-bin-hadoop2.7.tgz
~/Downloads$ cd
~$ ls
anaconda3 Downloads Pictures Templates
Desktop examples.desktop Public Videos
Documents Music spark-2.2.0-bin-hadoop2.7
~$ cd ~/spark-2.2.0-bin-hadoop2.7/
~/spark-2.2.0-bin-hadoop2.7$ ./bin/pyspark
>>> sc
<SparkContext master=local[*] appName=PySparkShell>
$ nano ~/.bashrc
#######################################
# Launch PySpark with Jupyter Notebook as the driver front end.
# Globals:
#   HOME        (read)     used to build the default Spark location
#   SPARK_HOME  (exported) kept if already set and non-empty; otherwise
#                          defaults to $HOME/spark-2.2.0-bin-hadoop2.7
#   PYSPARK_PYTHON, PYSPARK_DRIVER_PYTHON, PYSPARK_DRIVER_PYTHON_OPTS
#               (exported) the exports stay set in the calling shell,
#                          because a function runs in the current shell
# Arguments: any arguments are forwarded unchanged to bin/pyspark
# Returns:   the exit status of bin/pyspark
#######################################
sparknotebook() {
  # Build the path from $HOME instead of one specific user's home
  # directory; an already-exported SPARK_HOME takes precedence.
  export SPARK_HOME="${SPARK_HOME:-${HOME}/spark-2.2.0-bin-hadoop2.7}"
  export PYSPARK_PYTHON=python3
  export PYSPARK_DRIVER_PYTHON=jupyter
  export PYSPARK_DRIVER_PYTHON_OPTS="notebook"
  # Quoted so that an install path containing spaces still resolves.
  "${SPARK_HOME}/bin/pyspark" "$@"
}
$ source ~/.bashrc
$ sparknotebook
< Examples >
- Learning PySpark (Packt Publishing)
  https://github.com/drabastomek/learningPySpark
- Apache Spark Deep Learning Cookbook
  https://github.com/asherif844/ApacheSparkDeepLearningCookbook