#!/bin/bash

# This experiment is intended to document how the level of concurrent requests influence the latency, throughput, and success/failure rate
# Success - The percentage of requests that complete by their deadlines
# 	TODO: Does this handle non-200s?
# Throughput - The mean number of successful requests per second
# Latency - the rount-trip resonse time (unit?) of successful requests at the p50, p90, p99, and p100 percetiles

# Add bash_libraries directory to path
__run_sh__base_path="$(dirname "$(realpath --logical "${BASH_SOURCE[0]}")")"
__run_sh__bash_libraries_relative_path="../bash_libraries"
__run_sh__bash_libraries_absolute_path=$(cd "$__run_sh__base_path" && cd "$__run_sh__bash_libraries_relative_path" && pwd)
export PATH="$__run_sh__bash_libraries_absolute_path:$PATH"

source csv_to_dat.sh || exit 1
source framework.sh || exit 1
source get_result_count.sh || exit 1
source panic.sh || exit 1
source path_join.sh || exit 1
source validate_dependencies.sh || exit 1

validate_dependencies hey jq

declare -a workloads=()
declare -A port=()

# Example of stripping off multiple suffix from variable in format string_multiple
# test="ekf_12223.23343"
# ${test%%_+([[:digit:]]).+([[:digit:]])}
declare -Ar body=(
	[ekf]="-D ./ekf/ekf_raw.dat"
	[resize]="-D ./resize/shrinking_man_large.jpg"
	[lpd]="-D ./lpd/Cars0.png"
	[cifar10]="-D ./cifar10/airplane1.bmp"
)

initialize_globals() {
	while read -r line; do
		# Read into buffer array, splitting on commas
		readarray -t -d, buffer < <(echo -n "$line")
		workload="${buffer[1]}"
		# Update workload mix structures
		workloads+=("$workload")
		port+=(["$workload"]=$(get_port "$workload"))
	done < "$__run_sh__base_path/mix.csv"
}

get_port() {
	local name="$1"
	{
		echo "["
		cat ./spec.json
		echo "]"
	} | jq ".[] | select(.name == \"$name\") | .port"
}

run_experiments() {
	if (($# != 2)); then
		panic "invalid number of arguments \"$1\""
		return 1
	elif [[ -z "$1" ]]; then
		panic "hostname \"$1\" was empty"
		return 1
	elif [[ ! -d "$2" ]]; then
		panic "directory \"$2\" does not exist"
		return 1
	fi

	local hostname="$1"
	local results_directory="$2"

	local -A floor=()
	local -A length=()
	local -i total=0

	local -a buffer=()
	local workload=""
	local -i odds=0

	# Update workload mix structures
	while read -r line; do
		# Read into buffer array, splitting on commas
		readarray -t -d, buffer < <(echo -n "$line")
		# Use human friendly names
		odds="${buffer[0]}"
		workload="${buffer[1]}"
		floor+=(["$workload"]=$total)
		length+=(["$workload"]=$odds)
		((total += odds))
	done < mix.csv

	declare -ir random_max=32767
	# Validate Workload Mix
	if ((total <= 0 || total > random_max)); then
		echo "total must be between 1 and $random_max"
		exit 1
	fi

	# TODO: Check that workload is in spec.json
	local -ir batch_size=10
	local -i batch_id=0
	local -i roll=0
	local -ir total_iterations=10000
	local -ir worker_max=5
	local pids

	printf "Running Experiments: "

	# Select a random workload using the workload mix and run command, writing output to disk
	for ((i = 0; i < total_iterations; i += batch_size)); do
		# Block waiting for a worker to finish if we are at our max
		while (($(pgrep --count hey) >= worker_max)); do
			wait -n $(pgrep hey | tr '\n' ' ')
		done
		roll=$((RANDOM % total))
		((batch_id++))
		for workload in "${workloads[@]}"; do
			if ((roll >= floor[$workload] && roll < floor[$workload] + length[$workload])); then
				workload_class=$(echo "$workload"| cut -d'_' -f 1)
				hey -disable-compression -disable-keepalive -disable-redirects -n $batch_size -c 1 -cpus 1 -t 0 -o csv -m GET ${body[$workload_class]} "http://${hostname}:${port[$workload]}" > /dev/null 2> /dev/null &
				break
			fi
		done
	done
	pids=$(pgrep hey | tr '\n' ' ')
	[[ -n $pids ]] && wait -f $pids
	printf "[OK]\n"

	return 0
}

process_results() {
	if (($# != 1)); then
		error_msg "invalid number of arguments ($#, expected 1)"
		return 1
	elif ! [[ -d "$1" ]]; then
		error_msg "directory $1 does not exist"
		return 1
	fi

	local -r results_directory="$1"

	printf "Processing Results: "

	local -a metrics=(total queued initializing runnable running blocked returned)

	local -A fields=(
		[total]=6
		[queued]=7
		[initializing]=8
		[runnable]=9
		[running]=10
		[blocked]=11
		[returned]=12
	)

	# Write headers to CSVs
	for metric in "${metrics[@]}"; do
		printf "module,p50,p90,p99,p100\n" >> "$results_directory/$metric.csv"
	done
	printf "module,p50,p90,p99,p100\n" >> "$results_directory/memalloc.csv"

	for workload in "${workloads[@]}"; do
		mkdir "$results_directory/$workload"

		# TODO: Only include Complete

		for metric in "${metrics[@]}"; do
			awk -F, '$2 == "'"$workload"'" {printf("%.0f\n", $'"${fields[$metric]}"' / $13)}' < "$results_directory/perf.log" | sort -g > "$results_directory/$workload/${metric}_sorted.csv"
			oks=$(wc -l < "$results_directory/$workload/${metric}_sorted.csv")
			((oks == 0)) && continue # If all errors, skip line
			awk '
				BEGIN {
					sum = 0
					p50 = int('"$oks"' * 0.5)
					p90 = int('"$oks"' * 0.9)
					p99 = int('"$oks"' * 0.99)
					p100 = '"$oks"'
					printf "'"$workload"',"
				}
				NR==p50  {printf "%1.0f,",  $0}
				NR==p90  {printf "%1.0f,",  $0}
				NR==p99  {printf "%1.0f,",  $0}
				NR==p100 {printf "%1.0f\n", $0}
			' < "$results_directory/$workload/${metric}_sorted.csv" >> "$results_directory/${metric}.csv"

			# Delete scratch file used for sorting/counting
			# rm -rf "$results_directory/$workload/${metric}_sorted.csv"
		done

		# Memory Allocation
		awk -F, '$2 == "'"$workload"'" {printf("%.0f\n", $14)}' < "$results_directory/perf.log" | sort -g > "$results_directory/$workload/memalloc_sorted.csv"
		oks=$(wc -l < "$results_directory/$workload/memalloc_sorted.csv")
		((oks == 0)) && continue # If all errors, skip line
		awk '
			BEGIN {
				sum = 0
				p50 = int('"$oks"' * 0.5)
				p90 = int('"$oks"' * 0.9)
				p99 = int('"$oks"' * 0.99)
				p100 = '"$oks"'
				printf "'"$workload"',"
			}
			NR==p50  {printf "%1.0f,",  $0}
			NR==p90  {printf "%1.0f,",  $0}
			NR==p99  {printf "%1.0f,",  $0}
			NR==p100 {printf "%1.0f\n", $0}
		' < "$results_directory/$workload/memalloc_sorted.csv" >> "$results_directory/memalloc.csv"

		# Delete scratch file used for sorting/counting
		# rm -rf "$results_directory/$workload/memalloc_sorted.csv"

	done

	# Transform csvs to dat files for gnuplot
	for metric in "${metrics[@]}"; do
		csv_to_dat "$results_directory/$metric.csv"
	done
	csv_to_dat "$results_directory/memalloc.csv"

	printf "[OK]\n"
	return 0
}

experiment_server_post() {
	local -r results_directory="$1"

	# Only process data if SLEDGE_SANDBOX_PERF_LOG was set when running sledgert
	if [[ -n "$SLEDGE_SANDBOX_PERF_LOG" ]]; then
		if [[ -f "$__run_sh__base_path/$SLEDGE_SANDBOX_PERF_LOG" ]]; then
			mv "$__run_sh__base_path/$SLEDGE_SANDBOX_PERF_LOG" "$results_directory/perf.log"
			process_results "$results_directory" || return 1
		else
			echo "Perf Log was set, but perf.log not found!"
		fi
	fi
}

# Client Code
# Expected Symbol used by the framework
experiment_client() {
	local -r target_hostname="$1"
	local -r results_directory="$2"

	run_experiments "$target_hostname" "$results_directory" || return 1

	return 0
}

initialize_globals
framework_init "$@"