Skip to content

Commit

Permalink
Initial commit.
Browse files Browse the repository at this point in the history
  • Loading branch information
eli64s committed Mar 24, 2023
0 parents commit 1288a44
Show file tree
Hide file tree
Showing 5 changed files with 71 additions and 0 deletions.
9 changes: 9 additions & 0 deletions conf/conf.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
# Configuration constants

[kafka]
KAFKA_BOOTSTRAP_SERVERS = "localhost:9092"
KAFKA_TOPIC = "my_topic"

[flink]
FLINK_JOB_MANAGER = "localhost:8081"
FLINK_PARALLELISM = 4
36 changes: 36 additions & 0 deletions conf/flink-config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Flink configuration file

# JobManager configuration
jobmanager.rpc.address: localhost
jobmanager.rpc.port: 6123
jobmanager.heap.size: 1024m
jobmanager.rpc.numThreads: 8

# TaskManager configuration
taskmanager.memory.process.size: 1024m
taskmanager.memory.managed.size: 768m
taskmanager.numberOfTaskSlots: 2
taskmanager.rpc.numThreads: 8

# High Availability configuration
high-availability: zookeeper
high-availability.storageDir: hdfs://localhost:9000/flink/recovery
high-availability.zookeeper.quorum: localhost:2181
high-availability.zookeeper.path.root: /flink

# Parallelism and resource allocation
parallelism.default: 2
parallelism.max: 8
taskmanager.cpu.cores: 4

# State backend configuration
state.backend: rocksdb
state.checkpoints.dir: hdfs://localhost:9000/flink/checkpoints
state.backend.rocksdb.memory.managed: true
state.backend.rocksdb.predefined-options: FLASH_SSD_OPTIMIZED

# Logging configuration
log4j.logger.org.apache.flink: INFO,console
log4j.logger.org.apache.flink.client.cli: INFO,console
log4j.logger.org.apache.flink.runtime.rest: INFO,console
log4j.logger.org.apache.flink.runtime.rpc: INFO,console
7 changes: 7 additions & 0 deletions requirements.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
asyncio
aiohttp
aioresponses
apache-flink
apache-kafka
pandas
pyflink
10 changes: 10 additions & 0 deletions scripts/run.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
#!/bin/bash

# Start Flink cluster
flink/bin/start-cluster.sh

# Submit PyFlink job
flink/bin/flink run -py ./scripts/word_count.py

# Stop Flink cluster
flink/bin/stop-cluster.sh
9 changes: 9 additions & 0 deletions setup/setup.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
#!/bin/bash

conda create -n flink python=3.8
conda activate flink

python -m pip install apache-flink
pip install pyflink

export FLINK_CONDA_HOME=$(dirname $(dirname $CONDA_EXE))

0 comments on commit 1288a44

Please sign in to comment.