sledge/runtime/experiments/concurrency/run.sh

#!/bin/bash

# This experiment is intended to document how the level of concurrent requests influences latency, throughput, and the success/failure rate

# Resolve the directory containing this script, derive the absolute path of the
# sibling bash_libraries directory from it, and put that directory at the front
# of PATH so the libraries sourced below can be located by bare filename
__run_sh__base_path="$(dirname "$(realpath --logical "${BASH_SOURCE[0]}")")"
__run_sh__bash_libraries_relative_path="../bash_libraries"
__run_sh__bash_libraries_absolute_path=$(
	cd "$__run_sh__base_path" \
		&& cd "$__run_sh__bash_libraries_relative_path" \
		&& pwd
)
PATH="$__run_sh__bash_libraries_absolute_path:$PATH"
export PATH

source csv_to_dat.sh || exit 1
source framework.sh || exit 1
source generate_gnuplots.sh || exit 1
source get_result_count.sh || exit 1
source panic.sh || exit 1
source path_join.sh || exit 1

# Bail out before doing any work when the hey command used by the functions
# below cannot be found
command -v hey > /dev/null || {
	echo "hey is not present."
	exit 1
}

# Number of requests passed to hey (-n) for each concurrency level
declare -gi iterations
iterations=10000

# Concurrency levels passed to hey (-c), in the order they are run
declare -ga concurrency
concurrency=(1 20 40 60 80 100)

# Issue a small batch of requests against the target before the real
# experiments are run. The batch size (and concurrency) is the value of
# PERF_WINDOW_BUFFER_SIZE scraped from ../../include/perf_window.h, or 16 when
# that value cannot be determined.
# $1 (hostname) - host that serves the workload on port 10000
# Returns 0 on success, 1 on invalid arguments or if hey fails
run_samples() {
	if (($# != 1)); then
		panic "invalid number of arguments ($#, expected 1)"
		return 1
	elif [[ -z "$1" ]]; then
		panic "hostname \"$1\" was empty"
		return 1
	fi

	local -r hostname="$1"
	local -ri default_buffer_size=16

	# Scrape the perf window size from the source if possible
	# TODO: Make a util function
	local perf_window_path
	perf_window_path="$(path_join "$__run_sh__base_path" ../../include/perf_window.h)"
	local -r perf_window_path

	# Only the value is captured here; success is judged by validating that
	# value below. The exit status of a grep | cut pipeline would be cut's,
	# which is zero even when nothing matched.
	local scraped_size=""
	if [[ -r "$perf_window_path" ]]; then
		scraped_size=$(awk '$1 == "#define" && $2 == "PERF_WINDOW_BUFFER_SIZE" { print $3; exit }' "$perf_window_path")
	fi

	local -i perf_window_buffer_size
	if [[ "$scraped_size" =~ ^[0-9]+$ ]] && ((10#$scraped_size > 0)); then
		# 10# forces base ten so a leading zero is not read as octal
		perf_window_buffer_size=$((10#$scraped_size))
	else
		printf "Failed to scrape PERF_WINDOW_BUFFER_SIZE from ../../include/perf_window.h\n"
		printf "Defaulting to %d\n" "$default_buffer_size"
		perf_window_buffer_size=$default_buffer_size
	fi
	local -ir perf_window_buffer_size

	printf "Running Samples: "
	hey -n "$perf_window_buffer_size" -c "$perf_window_buffer_size" -q 200 -cpus 3 -o csv -m GET "http://${hostname}:10000" 1> /dev/null 2> /dev/null || {
		printf "[ERR]\n"
		panic "samples failed"
		return 1
	}

	printf "[OK]\n"
	return 0
}

# Execute the experiments: run hey once per entry of the global concurrency
# array, issuing $iterations requests each time, and store the CSV output as
# con<N>.csv in the results directory
# $1 (hostname) - host that serves the workload on port 10000
# $2 (results_directory) - a directory where we will store our results
# Returns 0 on success, 1 on invalid arguments, if hey fails, or if
# get_result_count rejects a result file
run_experiments() {
	if (($# != 2)); then
		panic "invalid number of arguments ($#, expected 2)"
		return 1
	elif [[ -z "$1" ]]; then
		panic "hostname \"$1\" was empty"
		return 1
	elif [[ ! -d "$2" ]]; then
		panic "directory \"$2\" does not exist"
		return 1
	fi

	local -r hostname="$1"
	local -r results_directory="$2"
	# Loop variable is kept local so it does not leak into the caller's scope
	local conn

	# Execute the experiments
	printf "Running Experiments:\n"
	for conn in "${concurrency[@]}"; do
		printf "\t%d Concurrency: " "$conn"
		hey -n "$iterations" -c "$conn" -cpus 2 -o csv -m GET "http://$hostname:10000" > "$results_directory/con$conn.csv" 2> /dev/null || {
			printf "[ERR]\n"
			panic "experiment failed"
			return 1
		}
		get_result_count "$results_directory/con$conn.csv" || {
			printf "[ERR]\n"
			panic "con$conn.csv unexpectedly has zero requests"
			return 1
		}
		printf "[OK]\n"
	done

	return 0
}

# Reduce the per-concurrency con<N>.csv files in a results directory into
# success.csv, throughput.csv and latency.csv (rows are appended), then hand
# those to csv_to_dat and generate_gnuplots.
# Reads the globals concurrency, iterations and __run_sh__base_path.
# $1 (results_directory) - directory containing the con<N>.csv files
# Returns 0 on success, 1 on invalid arguments, a missing con<N>.csv, or if
# generate_gnuplots fails
process_results() {
	if (($# != 1)); then
		panic "invalid number of arguments ($#, expected 1)"
		return 1
	elif ! [[ -d "$1" ]]; then
		panic "directory $1 does not exist"
		return 1
	fi

	local -r results_directory="$1"
	local conn raw_csv sorted_csv duration throughput
	local -i oks

	printf "Processing Results: "

	# Write headers to CSVs
	printf "Concurrency,Success_Rate\n" >> "$results_directory/success.csv"
	printf "Concurrency,Throughput\n" >> "$results_directory/throughput.csv"
	printf "Con,p50,p90,p99,p100\n" >> "$results_directory/latency.csv"

	for conn in "${concurrency[@]}"; do
		raw_csv="$results_directory/con$conn.csv"
		sorted_csv="$results_directory/con$conn-response.csv"

		if [[ ! -f "$raw_csv" ]]; then
			printf "[ERR]\n"
			panic "Missing $raw_csv"
			return 1
		fi

		# Calculate Success Rate for csv (percent of requests resulting in 200)
		awk -F, -v conn="$conn" -v total="$iterations" '
			$7 == 200 { ok++ }
			END { printf "%s,%3.5f\n", conn, (ok / total * 100) }
		' < "$raw_csv" >> "$results_directory/success.csv"

		# Filter on 200s, convert from s to ms, and sort
		awk -F, '$7 == 200 {print ($1 * 1000)}' < "$raw_csv" \
			| sort -g > "$sorted_csv"

		# Get Number of 200s
		oks=$(wc -l < "$sorted_csv")
		if ((oks == 0)); then
			# If all errors, skip line (but do not leave the scratch file behind)
			rm -f -- "$sorted_csv"
			continue
		fi

		# We determine duration by looking at the timestamp of the last complete request
		# TODO: Should this instead just use the client-side synthetic duration_sec value?
		duration=$(tail -n1 "$raw_csv" | cut -d, -f8)

		# Throughput is calculated as the mean number of successful requests per second.
		# awk keeps the fractional part and reports 0 for a zero or missing duration
		# instead of failing on a division by zero.
		throughput=$(awk -v oks="$oks" -v duration="$duration" 'BEGIN {
			printf "%f", (duration + 0 > 0) ? oks / duration : 0
		}')
		printf "%d,%s\n" "$conn" "$throughput" >> "$results_directory/throughput.csv"

		# Generate Latency Data for csv
		# Each percentile is the row number in the sorted file. Rows are clamped
		# to at least 1 so very small samples still emit every column.
		awk -v conn="$conn" -v oks="$oks" '
			function row(fraction,    r) {
				r = int(oks * fraction)
				return (r < 1) ? 1 : r
			}
			BEGIN {
				p50 = row(0.5)
				p90 = row(0.9)
				p99 = row(0.99)
				p100 = oks
				printf "%s,", conn
			}
			NR==p50 {printf "%1.4f,", $0}
			NR==p90 {printf "%1.4f,", $0}
			NR==p99 {printf "%1.4f,", $0}
			NR==p100 {printf "%1.4f\n", $0}
		' < "$sorted_csv" >> "$results_directory/latency.csv"

		# Delete scratch file used for sorting/counting
		rm -f -- "$sorted_csv"
	done

	# Transform csvs to dat files for gnuplot
	# NOTE(review): the exit status of csv_to_dat is not checked here, as in the
	# original; confirm whether its status is meaningful before adding a check
	csv_to_dat "$results_directory/success.csv" "$results_directory/throughput.csv" "$results_directory/latency.csv"

	# Generate gnuplots
	generate_gnuplots "$results_directory" "$__run_sh__base_path" || {
		printf "[ERR]\n"
		panic "failed to generate gnuplots"
		return 1
	}

	printf "[OK]\n"
	return 0
}

# Expected Symbol used by the framework
# Runs the three phases in order (samples, experiments, result processing)
# and stops at the first phase that fails
# $1 (target_hostname) - forwarded to run_samples and run_experiments
# $2 (results_directory) - forwarded to run_experiments and process_results
# Returns 0 when every phase succeeds, 1 otherwise
experiment_main() {
	local -r target_hostname="$1"
	local -r results_directory="$2"

	if ! run_samples "$target_hostname"; then
		return 1
	fi

	if ! run_experiments "$target_hostname" "$results_directory"; then
		return 1
	fi

	if ! process_results "$results_directory"; then
		return 1
	fi

	return 0
}

# Forward all command-line arguments to main. main is not defined in this file;
# presumably it comes from the sourced framework.sh and in turn invokes
# experiment_main - TODO confirm
main "$@"
test: add concurrency experiment 4 years ago			`#!/bin/bash`

			`# This experiment is intended to document how the level of concurrent requests influence the latency, throughput, and success/failure rate`

refactor: concurrency and payload use framework 4 years ago			`# Add bash_libraries directory to path`
			`__run_sh__base_path="$(dirname "$(realpath --logical "${BASH_SOURCE[0]}")")"`
			`__run_sh__bash_libraries_relative_path="../bash_libraries"`
			`__run_sh__bash_libraries_absolute_path=$(cd "$__run_sh__base_path" && cd "$__run_sh__bash_libraries_relative_path" && pwd)`
			`export PATH="$__run_sh__bash_libraries_absolute_path:$PATH"`

			`source csv_to_dat.sh \|\| exit 1`
			`source framework.sh \|\| exit 1`
			`source generate_gnuplots.sh \|\| exit 1`
			`source get_result_count.sh \|\| exit 1`
			`source panic.sh \|\| exit 1`
			`source path_join.sh \|\| exit 1`

chore: make command check silent 4 years ago			`if ! command -v hey > /dev/null; then`
chore: Install hey if needed 4 years ago			`echo "hey is not present."`
			`exit 1`
			`fi`

test: centralize bimodal and refactor concurrency 4 years ago			`declare -gi iterations=10000`
			`declare -ga concurrency=(1 20 40 60 80 100)`

			`run_samples() {`
refactor: concurrency and payload use framework 4 years ago			`if (($# != 1)); then`
			`panic "invalid number of arguments \"$1\""`
			`return 1`
			`elif [[ -z "$1" ]]; then`
			`panic "hostname \"$1\" was empty"`
			`return 1`
			`fi`

			`local hostname="$1"`
test: centralize bimodal and refactor concurrency 4 years ago
			`# Scrape the perf window size from the source if possible`
refactor: concurrency and payload use framework 4 years ago			`# TODO: Make a util function`
			`local -r perf_window_path="$(path_join "$__run_sh__base_path" ../../include/perf_window.h)"`
test: centralize bimodal and refactor concurrency 4 years ago			`local -i perf_window_buffer_size`
			`if ! perf_window_buffer_size=$(grep "#define PERF_WINDOW_BUFFER_SIZE" < "$perf_window_path" \| cut -d\ -f3); then`
refactor: concurrency and payload use framework 4 years ago			`printf "Failed to scrape PERF_WINDOW_BUFFER_SIZE from ../../include/perf_window.h\n"`
			`printf "Defaulting to 16\n"`
test: centralize bimodal and refactor concurrency 4 years ago			`perf_window_buffer_size=16`
			`fi`
			`local -ir perf_window_buffer_size`

			`printf "Running Samples: "`
			`hey -n "$perf_window_buffer_size" -c "$perf_window_buffer_size" -q 200 -cpus 3 -o csv -m GET "http://${hostname}:10000" 1> /dev/null 2> /dev/null \|\| {`
			`printf "[ERR]\n"`
refactor: concurrency and payload use framework 4 years ago			`panic "samples failed"`
test: centralize bimodal and refactor concurrency 4 years ago			`return 1`
			`}`

refactor: concurrency and payload use framework 4 years ago			`printf "[OK]\n"`
test: centralize bimodal and refactor concurrency 4 years ago			`return 0`
			`}`
test: add concurrency experiment 4 years ago
			`# Execute the experiments`
refactor: concurrency and payload use framework 4 years ago			`# $1 (hostname)`
			`# $2 (results_directory) - a directory where we will store our results`
test: centralize bimodal and refactor concurrency 4 years ago			`run_experiments() {`
refactor: concurrency and payload use framework 4 years ago			`if (($# != 2)); then`
			`panic "invalid number of arguments \"$1\""`
test: centralize bimodal and refactor concurrency 4 years ago			`return 1`
refactor: concurrency and payload use framework 4 years ago			`elif [[ -z "$1" ]]; then`
			`panic "hostname \"$1\" was empty"`
			`return 1`
			`elif [[ ! -d "$2" ]]; then`
			`panic "directory \"$2\" does not exist"`
test: centralize bimodal and refactor concurrency 4 years ago			`return 1`
			`fi`

refactor: concurrency and payload use framework 4 years ago			`local hostname="$1"`
			`local results_directory="$2"`
test: centralize bimodal and refactor concurrency 4 years ago
			`# Execute the experiments`
refactor: concurrency and payload use framework 4 years ago			`printf "Running Experiments:\n"`
test: centralize bimodal and refactor concurrency 4 years ago			`for conn in ${concurrency[*]}; do`
			`printf "\t%d Concurrency: " "$conn"`
refactor: concurrency and payload use framework 4 years ago			`hey -n "$iterations" -c "$conn" -cpus 2 -o csv -m GET "http://$hostname:10000" > "$results_directory/con$conn.csv" 2> /dev/null \|\| {`
			`printf "[ERR]\n"`
			`panic "experiment failed"`
			`return 1`
			`}`
			`get_result_count "$results_directory/con$conn.csv" \|\| {`
			`printf "[ERR]\n"`
			`panic "con$conn.csv unexpectedly has zero requests"`
			`return 1`
			`}`
			`printf "[OK]\n"`
test: centralize bimodal and refactor concurrency 4 years ago			`done`
refactor: concurrency and payload use framework 4 years ago
			`return 0`
test: centralize bimodal and refactor concurrency 4 years ago			`}`

			`process_results() {`
			`if (($# != 1)); then`
refactor: concurrency and payload use framework 4 years ago			`panic "invalid number of arguments ($#, expected 1)"`
test: centralize bimodal and refactor concurrency 4 years ago			`return 1`
			`elif ! [[ -d "$1" ]]; then`
refactor: concurrency and payload use framework 4 years ago			`panic "directory $1 does not exist"`
test: centralize bimodal and refactor concurrency 4 years ago			`return 1`
			`fi`

			`local -r results_directory="$1"`

refactor: concurrency and payload use framework 4 years ago			`printf "Processing Results: "`
test: centralize bimodal and refactor concurrency 4 years ago
			`# Write headers to CSVs`
			`printf "Concurrency,Success_Rate\n" >> "$results_directory/success.csv"`
			`printf "Concurrency,Throughput\n" >> "$results_directory/throughput.csv"`
			`printf "Con,p50,p90,p99,p100\n" >> "$results_directory/latency.csv"`

			`for conn in ${concurrency[*]}; do`
refactor: concurrency and payload use framework 4 years ago
			`if [[ ! -f "$results_directory/con$conn.csv" ]]; then`
			`printf "[ERR]\n"`
			`panic "Missing $results_directory/con$conn.csv"`
			`return 1`
			`fi`

test: centralize bimodal and refactor concurrency 4 years ago			`# Calculate Success Rate for csv (percent of requests resulting in 200)`
			`awk -F, '`
chore: bash cleanup 4 years ago			`$7 == 200 {ok++}`
			`END{printf "'"$conn"',%3.5f\n", (ok / '"$iterations"' * 100)}`
			`' < "$results_directory/con$conn.csv" >> "$results_directory/success.csv"`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`# Filter on 200s, convert from s to ms, and sort`
			`awk -F, '$7 == 200 {print ($1 * 1000)}' < "$results_directory/con$conn.csv" \`
			`\| sort -g > "$results_directory/con$conn-response.csv"`

			`# Get Number of 200s`
			`oks=$(wc -l < "$results_directory/con$conn-response.csv")`
			`((oks == 0)) && continue # If all errors, skip line`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`# We determine duration by looking at the timestamp of the last complete request`
			`# TODO: Should this instead just use the client-side synthetic duration_sec value?`
			`duration=$(tail -n1 "$results_directory/con$conn.csv" \| cut -d, -f8)`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`# Throughput is calculated as the mean number of successful requests per second`
			`throughput=$(echo "$oks/$duration" \| bc)`
			`printf "%d,%f\n" "$conn" "$throughput" >> "$results_directory/throughput.csv"`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`# Generate Latency Data for csv`
			`awk '`
chore: bash cleanup 4 years ago			`BEGIN {`
			`sum = 0`
			`p50 = int('"$oks"' * 0.5)`
			`p90 = int('"$oks"' * 0.9)`
			`p99 = int('"$oks"' * 0.99)`
			`p100 = '"$oks"'`
			`printf "'"$conn"',"`
			`}`
			`NR==p50 {printf "%1.4f,", $0}`
			`NR==p90 {printf "%1.4f,", $0}`
			`NR==p99 {printf "%1.4f,", $0}`
			`NR==p100 {printf "%1.4f\n", $0}`
			`' < "$results_directory/con$conn-response.csv" >> "$results_directory/latency.csv"`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`# Delete scratch file used for sorting/counting`
			`rm -rf "$results_directory/con$conn-response.csv"`
			`done`

			`# Transform csvs to dat files for gnuplot`
refactor: concurrency and payload use framework 4 years ago			`csv_to_dat "$results_directory/success.csv" "$results_directory/throughput.csv" "$results_directory/latency.csv"`
test: centralize bimodal and refactor concurrency 4 years ago
			`# Generate gnuplots`
refactor: concurrency and payload use framework 4 years ago			`generate_gnuplots "$results_directory" "$__run_sh__base_path" \|\| {`
			`printf "[ERR]\n"`
			`panic "failed to generate gnuplots"`
			`}`
test: add concurrency experiment 4 years ago
refactor: concurrency and payload use framework 4 years ago			`printf "[OK]\n"`
			`return 0`
			`}`

			`# Expected Symbol used by the framework`
			`experiment_main() {`
			`local -r target_hostname="$1"`
			`local -r results_directory="$2"`
test: add concurrency experiment 4 years ago
refactor: concurrency and payload use framework 4 years ago			`run_samples "$target_hostname" \|\| return 1`
			`run_experiments "$target_hostname" "$results_directory" \|\| return 1`
			`process_results "$results_directory" \|\| return 1`

			`return 0`
test: centralize bimodal and refactor concurrency 4 years ago			`}`
test: add concurrency experiment 4 years ago
test: centralize bimodal and refactor concurrency 4 years ago			`main "$@"`