mirror of
https://github.com/bspeice/kiva-dig
synced 2024-12-04 20:58:09 -05:00
Add a basic requirements file
Also add an easy script for running a Spark notebook
This commit is contained in:
parent
71627e160e
commit
df0132d466
2
.gitignore
vendored
2
.gitignore
vendored
@ -48,3 +48,5 @@ fabric.properties
|
|||||||
# Don't include the full snapshot ZIP since it's massive.
|
# Don't include the full snapshot ZIP since it's massive.
|
||||||
kiva_ds_json.zip
|
kiva_ds_json.zip
|
||||||
*.json
|
*.json
|
||||||
|
spark-*/
|
||||||
|
*.swp
|
||||||
|
1
requirements.txt
Normal file
1
requirements.txt
Normal file
@ -0,0 +1 @@
|
|||||||
|
py4j>=0.10.4
|
9
start_pyspark.sh
Executable file
9
start_pyspark.sh
Executable file
@ -0,0 +1,9 @@
|
|||||||
|
#!/usr/bin/env bash
#
# Start a Jupyter notebook whose driver is PySpark.
#
# On the first run the Spark distribution is downloaded and unpacked into the
# current working directory; later runs reuse the unpacked directory.
#
# Environment:
#   SPARK_URL  Optional override for the tarball location (for example a
#              different mirror). The archive must unpack to $SPARK_DIR.

# Abort on errors and unset variables; make a pipeline fail if any stage does.
set -euo pipefail

SPARK_DIR="spark-2.0.1-bin-hadoop2.7"
# NOTE(review): mirrors tend to drop old releases; if this one stops serving
# the tarball, point SPARK_URL at another location - confirm before changing
# the default.
SPARK_URL="${SPARK_URL:-http://apache.claz.org/spark/spark-2.0.1/spark-2.0.1-bin-hadoop2.7.tgz}"

if [ ! -d "$SPARK_DIR" ]; then
  echo "Downloading Spark distribution..."

  # Unpack into a scratch directory first so that $SPARK_DIR only ever appears
  # once it is complete. Otherwise an interrupted download would leave a
  # partial tree behind that passes the -d check above on every later run.
  # The scratch directory lives in the current directory so the final mv is a
  # rename on the same filesystem.
  staging="$(mktemp -d ./spark-download.XXXXXX)"
  trap 'rm -rf -- "$staging"' EXIT

  if ! wget "$SPARK_URL" -O - | tar xzf - -C "$staging"; then
    echo "Failed to download or unpack $SPARK_URL" >&2
    exit 1
  fi

  if [ ! -d "$staging/$SPARK_DIR" ]; then
    echo "Archive did not contain the expected directory $SPARK_DIR" >&2
    exit 1
  fi

  mv -- "$staging/$SPARK_DIR" "$SPARK_DIR"
  rm -rf -- "$staging"
  trap - EXIT
fi

# pyspark reads these two variables to decide which program acts as the driver
# front end; here it is told to launch `jupyter notebook`.
PYSPARK_DRIVER_PYTHON="jupyter" PYSPARK_DRIVER_PYTHON_OPTS="notebook" \
  "./$SPARK_DIR/bin/pyspark"
|
Loading…
Reference in New Issue
Block a user