From 32aab82414949ef262cc4c74f3f21918cc8342f9 Mon Sep 17 00:00:00 2001 From: Sebastian Nagel Date: Wed, 19 May 2021 15:33:48 +0200 Subject: [PATCH] Docker-compose: expose only UI ports (HDFS namenode, YARN resource manager and history server). Internal Hadoop communication ports are reachable only from inside the cluster. Fix Docker network name in README.md - should be the same as defined by DOCKER_NETWORK in the Makefile. --- README.md | 11 ++++++----- docker-compose.yml | 5 ++++- 2 files changed, 10 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index e836e345..275b4b71 100644 --- a/README.md +++ b/README.md @@ -7,7 +7,7 @@ Version 2.0.0 introduces uses wait_for_it script for the cluster startup # Hadoop Docker ## Supported Hadoop Versions -See repository branches for supported hadoop versions +See repository branches for supported Hadoop versions ## Quick Start @@ -26,16 +26,17 @@ Or deploy in swarm: docker stack deploy -c docker-compose-v3.yml hadoop ``` -`docker-compose` creates a docker network that can be found by running `docker network list`, e.g. `dockerhadoop_default`. +`docker-compose` creates a docker network that can be found by running `docker network list`, e.g. `docker-hadoop_default`. -Run `docker network inspect` on the network (e.g. `dockerhadoop_default`) to find the IP the hadoop interfaces are published on. Access these interfaces with the following URLs: +Run `docker network inspect` on the network (e.g. `docker-hadoop_default`) to find the IP the Hadoop interfaces are published on. Access these interfaces with the following URLs: * Namenode: http://:9870/dfshealth.html#tab-overview * History server: http://:8188/applicationhistory -* Datanode: http://:9864/ -* Nodemanager: http://:8042/node * Resource manager: http://:8088/ +All other Hadoop communication ports are not exposed and only accessible from inside the Docker network using service name and port, eg. `http://namenode:9000/`. + + ## Configure Environment Variables The configuration parameters can be specified in the hadoop.env file or as environmental variables for specific services (e.g. namenode, datanode etc.): diff --git a/docker-compose.yml b/docker-compose.yml index ed40dc62..4864fd39 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -7,7 +7,6 @@ services: restart: always ports: - 9870:9870 - - 9000:9000 volumes: - hadoop_namenode:/hadoop/dfs/name environment: @@ -30,6 +29,8 @@ services: image: bde2020/hadoop-resourcemanager:2.0.0-hadoop3.2.1-java8 container_name: resourcemanager restart: always + ports: + - 8088:8088 environment: SERVICE_PRECONDITION: "namenode:9000 namenode:9870 datanode:9864" env_file: @@ -48,6 +49,8 @@ services: image: bde2020/hadoop-historyserver:2.0.0-hadoop3.2.1-java8 container_name: historyserver restart: always + ports: + - 8188:8188 environment: SERVICE_PRECONDITION: "namenode:9000 namenode:9870 datanode:9864 resourcemanager:8088" volumes: