Skip to content

Commit 156aed7

Browse files
committed
update to hadoop 2.6.0
1 parent d93e369 commit 156aed7

File tree

2 files changed

+12
-12
lines changed

2 files changed

+12
-12
lines changed

Dockerfile

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,17 +1,17 @@
11
FROM sequenceiq/hadoop-docker:2.6.0
22
MAINTAINER SequenceIQ
33

4-
#support for Hadoop 2.4.0+
5-
RUN curl -s http://d3kbcqa49mib13.cloudfront.net/spark-1.4.0-bin-hadoop2.4.tgz | tar -xz -C /usr/local/
6-
RUN cd /usr/local && ln -s spark-1.4.0-bin-hadoop2.4 spark
4+
#support for Hadoop 2.6.0
5+
RUN curl -s http://d3kbcqa49mib13.cloudfront.net/spark-1.4.0-bin-hadoop2.6.tgz | tar -xz -C /usr/local/
6+
RUN cd /usr/local && ln -s spark-1.4.0-bin-hadoop2.6 spark
77
ENV SPARK_HOME /usr/local/spark
88
RUN mkdir $SPARK_HOME/yarn-remote-client
99
ADD yarn-remote-client $SPARK_HOME/yarn-remote-client
1010

11-
RUN $BOOTSTRAP && $HADOOP_PREFIX/bin/hadoop dfsadmin -safemode leave && $HADOOP_PREFIX/bin/hdfs dfs -put $SPARK_HOME-1.4.0-bin-hadoop2.4/lib /spark
11+
RUN $BOOTSTRAP && $HADOOP_PREFIX/bin/hadoop dfsadmin -safemode leave && $HADOOP_PREFIX/bin/hdfs dfs -put $SPARK_HOME-1.4.0-bin-hadoop2.6/lib /spark
1212

1313
ENV YARN_CONF_DIR $HADOOP_PREFIX/etc/hadoop
14-
ENV SPARK_JAR hdfs:///spark/spark-assembly-1.4.0-hadoop2.4.0.jar
14+
ENV SPARK_JAR hdfs:///spark/spark-assembly-1.4.0-hadoop2.6.0.jar
1515
ENV PATH $PATH:$SPARK_HOME/bin:$HADOOP_PREFIX/bin
1616
# update boot script
1717
COPY bootstrap.sh /etc/bootstrap.sh

README.md

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -15,12 +15,11 @@ docker build --rm -t sequenceiq/spark:1.4.0 .
1515
```
1616

1717
## Running the image
18+
19+
* in your /etc/hosts file, add the address returned by $(boot2docker ip) as host 'sandbox' to make it easier to access your sandbox UI
20+
* open the UI ports when starting the image
1821
```
19-
docker run -i -t -h sandbox sequenceiq/spark:1.4.0 bash
20-
```
21-
or
22-
```
23-
docker run -d -h sandbox sequenceiq/spark:1.4.0 -d
22+
docker run -it -p 8088:8088 -p 8042:8042 -p 8080:8080 -p 7077:7077 -p 6066:6066 -h sandbox sequenceiq/spark:1.4.0 bash
2423
```
2524

2625
## Versions
@@ -38,6 +37,7 @@ In yarn-client mode, the driver runs in the client process, and the application
3837

3938
```
4039
# run the spark shell
40+
# set memory limits appropriately, or the Spark context will not be able to start
4141
spark-shell --master yarn-client --driver-memory 1g --executor-memory 1g --executor-cores 1
4242
4343
# execute the following command, which should return 1000
@@ -51,12 +51,12 @@ Estimating Pi (yarn-cluster mode):
5151

5252
```
5353
# execute the following command, which should write "Pi is roughly 3.1418" into the logs
54-
spark-submit --class org.apache.spark.examples.SparkPi --master yarn-cluster --driver-memory 1g --executor-memory 1g --executor-cores 1 $SPARK_HOME/lib/spark-examples-1.4.0-hadoop2.4.0.jar
54+
spark-submit --class org.apache.spark.examples.SparkPi --master yarn-cluster --driver-memory 1g --executor-memory 1g --executor-cores 1 $SPARK_HOME/lib/spark-examples-1.4.0-hadoop2.6.0.jar
5555
```
5656

5757
Estimating Pi (yarn-client mode):
5858

5959
```
6060
# execute the following command, which should print "Pi is roughly 3.1418" to the screen
61-
spark-submit --class org.apache.spark.examples.SparkPi --master yarn-client --driver-memory 1g --executor-memory 1g --executor-cores 1 $SPARK_HOME/lib/spark-examples-1.4.0-hadoop2.4.0.jar
61+
spark-submit --class org.apache.spark.examples.SparkPi --master yarn-client --driver-memory 1g --executor-memory 1g --executor-cores 1 $SPARK_HOME/lib/spark-examples-1.4.0-hadoop2.6.0.jar
6262
```

0 commit comments

Comments
 (0)