This is an automated email from the ASF dual-hosted git repository. xxyu pushed a commit to branch kylin-on-parquet-v2 in repository https://gitbox.apache.org/repos/asf/kylin.git
The following commit(s) were added to refs/heads/kylin-on-parquet-v2 by this push: new 5125ef6 HOTFIX Add missing docker file: Dockerfile_hadoop 5125ef6 is described below commit 5125ef614fd3269646bc66ffc0931e8b4a756a88 Author: Zhichao Zhang <441586...@qq.com> AuthorDate: Tue Feb 9 16:42:56 2021 +0800 HOTFIX Add missing docker file: Dockerfile_hadoop --- docker/dockerfile/standalone/Dockerfile_hadoop | 96 ++++++++++++++++++++++++++ 1 file changed, 96 insertions(+) diff --git a/docker/dockerfile/standalone/Dockerfile_hadoop b/docker/dockerfile/standalone/Dockerfile_hadoop new file mode 100644 index 0000000..8e76855 --- /dev/null +++ b/docker/dockerfile/standalone/Dockerfile_hadoop @@ -0,0 +1,96 @@ +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+#
+
+# Docker image with Hadoop/Spark/Hive/ZK/Kafka installed.
+#
+# All components are downloaded and unpacked under /home/admin (the WORKDIR);
+# their configuration files are copied in from the conf/ directory of the
+# build context.
+FROM centos:6.9
+
+# Versions of the bundled components.
+ENV HIVE_VERSION=1.2.1 \
+    HADOOP_VERSION=2.7.0 \
+    SPARK_VERSION=2.4.6 \
+    ZK_VERSION=3.4.6 \
+    KAFKA_VERSION=1.1.1
+
+# Installation directories. Kept in a separate ENV instruction from the
+# versions above because variables set within a single ENV instruction
+# cannot reference one another.
+ENV JAVA_HOME=/home/admin/jdk1.8.0_141 \
+    MVN_HOME=/home/admin/apache-maven-3.6.1 \
+    HADOOP_HOME=/home/admin/hadoop-$HADOOP_VERSION \
+    HIVE_HOME=/home/admin/apache-hive-$HIVE_VERSION-bin \
+    SPARK_HOME=/home/admin/spark-$SPARK_VERSION-bin-hadoop2.7 \
+    ZK_HOME=/home/admin/zookeeper-$ZK_VERSION \
+    KAFKA_HOME=/home/admin/kafka_2.11-$KAFKA_VERSION
+
+# Configuration directories and PATH, derived from the directories above.
+ENV HADOOP_CONF=$HADOOP_HOME/etc/hadoop \
+    HADOOP_CONF_DIR=$HADOOP_HOME/etc/hadoop \
+    SPARK_CONF_DIR=$SPARK_HOME/conf \
+    PATH=$PATH:$JAVA_HOME/bin:$ZK_HOME/bin:$HADOOP_HOME/bin:$HIVE_HOME/bin:$MVN_HOME/bin:$KAFKA_HOME/bin
+
+USER root
+
+WORKDIR /home/admin
+
+# install tools (yum cache is removed in the same layer to keep it small)
+RUN yum -y install \
+        git.x86_64 \
+        lsof.x86_64 \
+        mysql-server.x86_64 \
+        mysql.x86_64 \
+        tar.x86_64 \
+        unzip.x86_64 \
+        wget.x86_64 \
+    && yum clean all
+
+# install mvn
+RUN wget https://archive.apache.org/dist/maven/maven-3/3.6.1/binaries/apache-maven-3.6.1-bin.tar.gz \
+    && tar -zxvf apache-maven-3.6.1-bin.tar.gz \
+    && rm -f apache-maven-3.6.1-bin.tar.gz
+COPY conf/maven/settings.xml $MVN_HOME/conf/settings.xml
+
+# install npm
+# pipefail + `curl -f` make the step fail when the setup script cannot be
+# downloaded, instead of piping an empty/error body into bash and carrying on.
+# (/bin/sh is bash on CentOS, so `set -o pipefail` is available.)
+RUN set -o pipefail \
+    && curl -fsSL https://rpm.nodesource.com/setup_8.x | bash - \
+    && yum install -y nodejs \
+    && yum clean all
+
+# setup jdk
+# NOTE(review): --no-check-certificate disables TLS certificate verification
+# and the downloaded archive is not checksum-verified; consider fetching the
+# JDK from a trusted mirror and verifying its checksum.
+RUN wget --no-cookies --no-check-certificate --header "Cookie: gpw_e24=http%3A%2F%2Fwww.oracle.com%2F; oraclelicense=accept-securebackup-cookie" "http://download.oracle.com/otn-pub/java/jdk/8u141-b15/336fa29ff2bb4ef291e347e091f7f4a7/jdk-8u141-linux-x64.tar.gz" \
+    && tar -zxvf /home/admin/jdk-8u141-linux-x64.tar.gz \
+    && rm -f /home/admin/jdk-8u141-linux-x64.tar.gz
+
+# setup hadoop
+RUN wget https://archive.apache.org/dist/hadoop/core/hadoop-$HADOOP_VERSION/hadoop-$HADOOP_VERSION.tar.gz \
+    && tar -zxvf /home/admin/hadoop-$HADOOP_VERSION.tar.gz \
+    && rm -f /home/admin/hadoop-$HADOOP_VERSION.tar.gz \
+    && mkdir -p /data/hadoop
+COPY conf/hadoop/* $HADOOP_CONF/
+
+# setup hive (the MySQL JDBC driver is added to Hive's lib directory)
+RUN wget https://archive.apache.org/dist/hive/hive-$HIVE_VERSION/apache-hive-$HIVE_VERSION-bin.tar.gz \
+    && tar -zxvf /home/admin/apache-hive-$HIVE_VERSION-bin.tar.gz \
+    && rm -f /home/admin/apache-hive-$HIVE_VERSION-bin.tar.gz \
+    && wget -P $HIVE_HOME/lib https://repo1.maven.org/maven2/mysql/mysql-connector-java/5.1.24/mysql-connector-java-5.1.24.jar
+COPY conf/hive/hive-site.xml $HIVE_HOME/conf/
+COPY conf/hive/hive-site.xml $HADOOP_CONF/
+
+# setup spark
+# Spark reuses Hive's hive-site.xml, MySQL JDBC driver and hcatalog-core jar,
+# and its yarn jars are copied into Hadoop's yarn lib directory.
+# The hcatalog jar name follows $HIVE_VERSION so a version bump does not
+# break this step.
+RUN wget https://archive.apache.org/dist/spark/spark-$SPARK_VERSION/spark-$SPARK_VERSION-bin-hadoop2.7.tgz \
+    && tar -zxvf /home/admin/spark-$SPARK_VERSION-bin-hadoop2.7.tgz \
+    && rm -f /home/admin/spark-$SPARK_VERSION-bin-hadoop2.7.tgz \
+    && cp $HIVE_HOME/conf/hive-site.xml $SPARK_HOME/conf \
+    && cp $SPARK_HOME/yarn/*.jar $HADOOP_HOME/share/hadoop/yarn/lib \
+    && cp $HIVE_HOME/lib/mysql-connector-java-5.1.24.jar $SPARK_HOME/jars \
+    && cp $HIVE_HOME/hcatalog/share/hcatalog/hive-hcatalog-core-$HIVE_VERSION.jar $SPARK_HOME/jars/
+COPY conf/spark/* $SPARK_CONF_DIR/
+
+# setup kafka
+RUN wget https://archive.apache.org/dist/kafka/$KAFKA_VERSION/kafka_2.11-$KAFKA_VERSION.tgz \
+    && tar -zxvf /home/admin/kafka_2.11-$KAFKA_VERSION.tgz \
+    && rm -f /home/admin/kafka_2.11-$KAFKA_VERSION.tgz
+
+# setup zk
+RUN wget https://archive.apache.org/dist/zookeeper/zookeeper-$ZK_VERSION/zookeeper-$ZK_VERSION.tar.gz \
+    && tar -zxvf /home/admin/zookeeper-$ZK_VERSION.tar.gz \
+    && rm -f /home/admin/zookeeper-$ZK_VERSION.tar.gz \
+    && mkdir -p /data/zookeeper
+COPY conf/zk/zoo.cfg $ZK_HOME/conf/