- Prerequirement:
- add 127.0.0.1 kafka in your /etc/hosts
docker build . -t beam-python
cd data-loading/tweets-file
docker run -v "`pwd`/src:/src" --rm -it --name tweets-file beam-python
- Generate tweets.json in $PWD/src
- move $PWD/src/tweets.json to /tmp
- direct-runner
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.CountTweet -Dexec.args="--input=/tmp/tweets.json --output=/tmp/lead/tweets.csv" -Pdirect-runner
- Flink local
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.CountTweet -Dexec.args="--input=/tmp/tweets.json --output=/tmp/lead/tweets.csv --runner=FlinkRunner" -Pflink-runner
- direct-runner
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.TopTweet -Dexec.args="--input=/tmp/tweets.json --output=/tmp/tweets/leadboard" -Pdirect-runner
- Flink local
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.TopTweet -Dexec.args="--input=/tmp/tweets.json --runner=FlinkRunner --output=/tmp/tweets/leadboard" -Pflink-runner
docker-compose up -d
cd data-loading/tweets-kafka
docker run -v "`pwd`/src:/src" --rm -it --add-host kafka:172.17.0.1 --name tweets-kafka beam-python
- direct-runner
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.KafkaTopTweet -Pdirect-runner
- Flink local
mvn clean compile exec:java -Dexec.mainClass=fr.ippon.beam.demo.KafkaTopTweet -Pflink-runner