Compare commits

..

2 Commits

Author SHA1 Message Date
530f545b89 Merge branch 'amd' into arm 2024-04-02 13:46:08 +05:30
0dd01b6e0e Modify Dockerfile 2024-02-06 14:44:12 +05:30
3 changed files with 23 additions and 77 deletions

View File

@@ -36,7 +36,7 @@ COPY hdfs-site.xml $HADOOP_HOME/etc/hadoop/hdfs-site.xml
COPY mapred-site.xml $HADOOP_HOME/etc/hadoop/mapred-site.xml COPY mapred-site.xml $HADOOP_HOME/etc/hadoop/mapred-site.xml
COPY yarn-site.xml $HADOOP_HOME/etc/hadoop/yarn-site.xml COPY yarn-site.xml $HADOOP_HOME/etc/hadoop/yarn-site.xml
RUN echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64" >> ~/.bashrc && \ RUN echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-arm64" >> ~/.bashrc && \
echo "export HADOOP_HOME=/usr/local/hadoop" >> ~/.bashrc && \ echo "export HADOOP_HOME=/usr/local/hadoop" >> ~/.bashrc && \
echo "export HADOOP_INSTALL=\$HADOOP_HOME" >> ~/.bashrc && \ echo "export HADOOP_INSTALL=\$HADOOP_HOME" >> ~/.bashrc && \
echo "export HADOOP_MAPRED_HOME=\$HADOOP_HOME" >> ~/.bashrc && \ echo "export HADOOP_MAPRED_HOME=\$HADOOP_HOME" >> ~/.bashrc && \
@@ -52,7 +52,7 @@ RUN echo "HDFS_NAMENODE_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh
echo "HDFS_SECONDARYNAMENODE_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \ echo "HDFS_SECONDARYNAMENODE_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \
echo "YARN_NODEMANAGER_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \ echo "YARN_NODEMANAGER_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \
echo "YARN_RESOURCEMANAGER_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \ echo "YARN_RESOURCEMANAGER_USER=root" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \
echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \ echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-arm64" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh && \
echo "export HADOOP_CLASSPATH+=\" \$HADOOP_HOME/lib/*.jar\"" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh echo "export HADOOP_CLASSPATH+=\" \$HADOOP_HOME/lib/*.jar\"" >> /usr/local/hadoop/etc/hadoop/hadoop-env.sh
# Install pig # Install pig
@@ -64,13 +64,13 @@ RUN wget -O pig.tar.gz https://downloads.apache.org/pig/pig-0.17.0/pig-0.17.0.ta
echo "export PIG_CLASSPATH=\$HADOOP_HOME/etc/hadoop" >> ~/.bashrc echo "export PIG_CLASSPATH=\$HADOOP_HOME/etc/hadoop" >> ~/.bashrc
# Install hbase # Install hbase
RUN wget https://apache.mirror.gtcomm.net/hbase/3.0.0-beta-1/hbase-3.0.0-beta-1-bin.tar.gz && \ RUN wget http://apache.mirror.gtcomm.net/hbase/2.5.8/hbase-2.5.8-bin.tar.gz && \
tar -xzvf hbase-3.0.0-beta-1-bin.tar.gz && \ tar -xzvf hbase-2.5.8-bin.tar.gz && \
mv hbase-3.0.0-beta-1-bin.tar.gz /usr/local/hbase && \ mv hbase-2.5.8 /usr/local/hbase && \
echo "export HBASE_HOME=/usr/local/hbase" >> ~/.bashrc && \ echo "export HBASE_HOME=/usr/local/hbase" >> ~/.bashrc && \
echo "export PATH=\$PATH:\$HBASE_HOME/bin" >> ~/.bashrc && \ echo "export PATH=\$PATH:\$HBASE_HOME/bin" >> ~/.bashrc && \
echo "export HBASE_DISABLE_HADOOP_CLASSPATH_LOOKUP=\"true\"" >> /usr/local/hbase/conf/hbase-env.sh && \ echo "export HBASE_DISABLE_HADOOP_CLASSPATH_LOOKUP=\"true\"" >> /usr/local/hbase/conf/hbase-env.sh && \
echo "JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/" >> /usr/local/hbase/conf/hbase-env.sh echo "JAVA_HOME=/usr/lib/jvm/java-8-openjdk-arm64/" >> /usr/local/hbase/conf/hbase-env.sh
COPY hbase-site.xml ~/hbase-site.xml COPY hbase-site.xml ~/hbase-site.xml
RUN mkdir -p /hadoop/zookeeper && \ RUN mkdir -p /hadoop/zookeeper && \

View File

@@ -1,35 +1,2 @@
# Hadoop on Docker # Hadoop on Docker
## Linux/WSL
### Installation
```bash
curl -fsSL https://bit.ly/hadock-install -o ~/hadoock && chmod +x ~/hadoock && sudo mv ~/hadoock /usr/bin/hadoock
```
If you're using WSL, make sure to update it first:
```powershell
wsl.exe --update
```
### Usage
```bash
hadock
```
### Update
```bash
hadock --uninstall
curl -fsSL https://bit.ly/hadock-install | bash
```
#### Copying from host
```bash
dockcp /path/to/file
```
This command copies `/path/to/file` from the host to `/home` in your Docker container.
#### Running multiple instances
```bash
hadock_again
```
Use this command to open another shell in the same running Docker container.
### Uninstallation
```bash
hadock --uninstall
```
Check the [wiki](https://github.com/silicoflare/docker-hadoop/wiki) for a full guide to use this docker image. Check the [wiki](https://github.com/silicoflare/docker-hadoop/wiki) for a full guide to use this docker image.

55
kafka
View File

@@ -1,41 +1,20 @@
#!/bin/bash #!/bin/bash
verb="$1" verb=$1
arg="$2" arg=$2
# Check if KAFKA_HOME is set if [ $verb == "start" ]; then
if [ -z "$KAFKA_HOME" ]; then if [ $arg == "zookeeper" ]; then
echo "Error: KAFKA_HOME is not set" $KAFKA_HOME/bin/zookeeper-server-start.sh $KAFKA_HOME/config/zookeeper.properties
exit 1 elif [ $arg == "kafka" ]; then
fi $KAFKA_HOME/bin/kafka-server-start.sh $KAFKA_HOME/config/server.properties
fi
case "$verb" in elif [ $verb == "create-topic" ]; then
"start") $KAFKA_HOME/bin/kafka-topics.sh --create --topic $arg --bootstrap-server localhost:9092
if [ "$arg" == "zookeeper" ]; then elif [ $verb == "produce" ]; then
"$KAFKA_HOME/bin/zookeeper-server-start.sh" "$KAFKA_HOME/config/zookeeper.properties" & $KAFKA_HOME/bin/kafka-console-producer.sh --topic $arg --bootstrap-server localhost:9092
elif [ "$arg" == "kafka" ]; then elif [ $verb == "consume" ]; then
"$KAFKA_HOME/bin/kafka-server-start.sh" "$KAFKA_HOME/config/server.properties" & $KAFKA_HOME/bin/kafka-console-consumer.sh --topic $arg --from-beginning --bootstrap-server localhost:9092
else elif [ $verb == "submit" ]; then
echo "Error: Invalid argument for 'start'. Use 'zookeeper' or 'kafka'." spark-submit --packages org.apache.spark:spark-sql-kafka-0-10_2.12:3.0.1 $arg
fi fi
;;
"create-topic")
"$KAFKA_HOME/bin/kafka-topics.sh" --create --topic "$arg" --bootstrap-server localhost:9092 &
;;
"produce")
"$KAFKA_HOME/bin/kafka-console-producer.sh" --topic "$arg" --bootstrap-server localhost:9092 &
;;
"consume")
"$KAFKA_HOME/bin/kafka-console-consumer.sh" --topic "$arg" --from-beginning --bootstrap-server localhost:9092 &
;;
"submit")
if [ -z "$arg" ]; then
echo "Error: Please provide a Spark script."
else
spark-submit --packages org.apache.spark:spark-sql-kafka-0-10_2.12:3.0.1 "$arg" &
fi
;;
*)
echo "Error: Unknown verb. Use 'start', 'create-topic', 'produce', 'consume', or 'submit'."
;;
esac