- Kafka, Kafka-ui
- Apache Spark
- Apache Flink
- Apache Beam
- Docker-compose
docker-compose up -d kafka zookeeper kafka-ui
Verify Kafka cluster on Kafka-ui
docker-compose up -d producer
Verify message on Kafka-ui
docker-compose up -d spark-master spark-worker
NOTE: If the Docker image build is too slow (caused by slow downloading), download the following file manually:
export SPARK_VERSION=3.0.2
export HADOOP_VERSION=3.2
export SPARK_HOME=/opt/spark
https://archive.apache.org/dist/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop${HADOOP_VERSION}.tgz
Verify Spark cluster on Spark-ui
docker exec -it spark-master /bin/sh
/opt/spark/bin/spark-submit --master spark://spark-master:7077 \
--packages org.apache.spark:spark-sql-kafka-0-10_2.12:3.0.2 \
/opt/spark-apps/spark-consumer.py
flink-sql-connector-kafka-3.1.0-1.18.jar
docker build --tag pyflink:latest ./pyflink
docker-compose up -d taskmanager jobmanager
Verify Flink cluster on Flink-ui
docker exec -it streaming-kakfa_jobmanager_1 /bin/sh
./bin/flink run -py ./app/test-stream.py \
--jarfile ./app/external_jars/flink-sql-connector-kafka-3.1.0-1.18.jar
Verify Flink cluster on Flink-ui
python3 beam-consumer.py --runner FlinkRunner \
--bootstrap_servers localhost:9092 \
--topics hieuung \
--flink_master localhost:8081 \