#!/usr/bin/env bash
################################################################################
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
################################################################################

# End-to-end test: configures the cluster via set_config_key, starts it with
# additional TaskManagers and submits the heavy deployment stress test program.
#
# Relies on common.sh (sourced below) for set_config_key, start_cluster and
# start_taskmanagers, and on TEST_DATA_DIR, END_TO_END_DIR and FLINK_DIR being
# set by the time they are expanded here.

source "$(dirname "$0")/common.sh"

CHECKPOINT_DIR="file://$TEST_DATA_DIR/savepoint-e2e-test-chckpt-dir"

TEST=flink-heavy-deployment-stress-test
TEST_PROGRAM_NAME=HeavyDeploymentStressTestProgram
TEST_PROGRAM_JAR="${END_TO_END_DIR}/${TEST}/target/${TEST_PROGRAM_NAME}.jar"

set_config_key "pekko.ask.timeout" "60 s"
set_config_key "web.timeout" "60000"

# 1024 MB process size per TM x 5 TMs = 5 GB in total.
set_config_key "taskmanager.memory.process.size" "1024m"
# Intended as 8 MB according to the original note.
# NOTE(review): the value carries no unit suffix - confirm how Flink parses it.
set_config_key "taskmanager.memory.managed.size" "8"
set_config_key "taskmanager.memory.network.min" "128mb"
set_config_key "taskmanager.memory.network.max" "128mb"
set_config_key "taskmanager.network.request-backoff.max" "60000"
set_config_key "taskmanager.memory.segment-size" "8kb"
set_config_key "taskmanager.memory.jvm-metaspace.size" "64m"
set_config_key "taskmanager.memory.framework.off-heap.size" "200m"

set_config_key "taskmanager.numberOfTaskSlots" "20" # 20 slots per TM

start_cluster        # this also starts 1 TM
start_taskmanagers 4 # 1 TM + 4 TMs = 5 TMs with 20 slots each = 100 slots

# This call will result in a deployment with state meta data of
# 100 x 100 x 40 union states x each 40 entries.
# We can scale up the numbers to make the test even heavier.
# Path-valued expansions are quoted so that directories containing whitespace
# or glob characters are passed through as single arguments.
"$FLINK_DIR/bin/flink" run "${TEST_PROGRAM_JAR}" \
  --environment.max_parallelism 1024 --environment.parallelism 100 \
  --environment.restart_strategy fixed_delay --environment.restart_strategy.fixed_delay.attempts 3 \
  --state_backend.checkpoint_directory "${CHECKPOINT_DIR}" \
  --heavy_deployment_test.num_list_states_per_op 40 --heavy_deployment_test.num_partitions_per_list_state 40