feat: Initial MVP of admissions control

4 years ago · 76ba308c16
parent abfb9b18e4
commit 76ba308c16
5 changed files with 81 additions and 3 deletions
--- a/runtime/include/runtime.h
+++ b/runtime/include/runtime.h
@ -29,6 +29,18 @@ extern float runtime_processor_speed_MHz;
 extern pthread_t runtime_worker_threads[];
 extern uint32_t  runtime_worker_threads_count;
 /*
 * Unitless estimate of the instantaneous fraction of system capacity required to complete all previously
 * admitted work. This is used to calculate free capacity as part of admissions control
 *
 * The estimated requirements of a single admitted request is calculated as
 * estimated execution time (cycles) / relative deadline (cycles)
 *
 * These estimates are incremented on request acceptance and decremented on request completion (either
 * success or failure)
 */
 extern double runtime_admitted;
 void         alloc_linear_memory(void);
 void         expand_memory(void);
 INLINE char *get_function_from_table(uint32_t idx, uint32_t type_id);
--- a/runtime/include/sandbox.h
+++ b/runtime/include/sandbox.h
@ -81,6 +81,12 @@ struct sandbox {
 	uint64_t absolute_deadline;
 	uint64_t total_time; /* From Request to Response */
 	/*
 	 * Unitless estimate of the instantaneous fraction of system capacity required to run the request
 	 * Calculated by estimated execution time (cycles) / relative deadline (cycles)
 	 */
 	double admissions_estimate;
 	struct module *module; /* the module this is an instance of */
 	int32_t arguments_offset; /* actual placement of arguments in the sandbox. */
--- a/runtime/include/sandbox_request.h
+++ b/runtime/include/sandbox_request.h
@ -14,6 +14,12 @@ struct sandbox_request {
 	struct sockaddr *socket_address;
 	uint64_t         request_arrival_timestamp; /* cycles */
 	uint64_t         absolute_deadline;         /* cycles */
 	/*
 	 * Unitless estimate of the instantaneous fraction of system capacity required to run the request
 	 * Calculated by estimated execution time (cycles) / relative deadline (cycles)
 	 */
 	double admissions_estimate;
 };
 DEQUE_PROTOTYPE(sandbox, struct sandbox_request *);
@ -29,7 +35,8 @@ DEQUE_PROTOTYPE(sandbox, struct sandbox_request *);
 */
 static inline struct sandbox_request *
 sandbox_request_allocate(struct module *module, char *arguments, int socket_descriptor,
-                         const struct sockaddr *socket_address, uint64_t request_arrival_timestamp)
+                         const struct sockaddr *socket_address, uint64_t request_arrival_timestamp,
                         double admissions_estimate)
 {
 	struct sandbox_request *sandbox_request = (struct sandbox_request *)malloc(sizeof(struct sandbox_request));
 	assert(sandbox_request);
@ -39,6 +46,7 @@ sandbox_request_allocate(struct module *module, char *arguments, int socket_desc
 	sandbox_request->socket_address            = (struct sockaddr *)socket_address;
 	sandbox_request->request_arrival_timestamp = request_arrival_timestamp;
 	sandbox_request->absolute_deadline         = request_arrival_timestamp + module->relative_deadline;
 	sandbox_request->admissions_estimate       = admissions_estimate;
 	debuglog("Allocating %lu of %s:%d\n", sandbox_request->request_arrival_timestamp, sandbox_request->module->name,
 	         sandbox_request->module->port);
--- a/runtime/src/runtime.c
+++ b/runtime/src/runtime.c
@ -16,7 +16,8 @@
 * Shared Process State    *
 **************************/
-int runtime_epoll_file_descriptor;
+int    runtime_epoll_file_descriptor;
 double runtime_admitted;
 /******************************************
 * Shared Process / Listener Thread Logic *
@ -44,6 +45,8 @@ runtime_initialize(void)
 	/* Initialize http_parser_settings global */
 	http_parser_settings_initialize();
 	runtime_admitted = 0;
 }
 /*************************
@ -92,14 +95,45 @@ listener_thread_main(void *dummy)
 			}
 			total_requests++;
 			/* Perform Admission Control */
 			/*
 			 * TODO: Enhance to use configurable percentiles rather than just mean. This can be policy
 			 * defined in the module specification
 			 */
 			uint64_t estimated_execution = perf_window_get_mean(&module->perf_window);
 			/*
 			 * If this is the first execution, assume a default execution
 			 * TODO: Enhance module specification to provide "seed" value of estimated duration
 			 * TODO: Should we "rate limit" or only admit one request before we have actual data? Otherwise
 			 * we might be flooded with sandboxes that possibly underestimate
 			 */
 			if (estimated_execution == -1) estimated_execution = 1000;
 			double admissions_estimate = (double)estimated_execution / module->relative_deadline;
 			/*
 			 * Reject Requests that exceed system capacity
 			 * TODO: Enhance to gracefully return HTTP status code 503 Service Unavailable
 			 */
 			if (runtime_admitted + admissions_estimate >= runtime_worker_threads_count) {
 				debuglog("Would have rejected!");
 			}
 			/* Allocate a Sandbox Request */
 			struct sandbox_request *sandbox_request =
 			  sandbox_request_allocate(module, module->name, socket_descriptor,
-			                           (const struct sockaddr *)&client_address, request_arrival_timestamp);
+			                           (const struct sockaddr *)&client_address, request_arrival_timestamp,
 			                           admissions_estimate);
 			assert(sandbox_request);
 			/* Add to the Global Sandbox Request Scheduler */
 			global_request_scheduler_add(sandbox_request);
 			/* Add to work accepted by the runtime */
 			runtime_admitted += admissions_estimate;
 			debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
 		}
 	}
--- a/runtime/src/sandbox.c
+++ b/runtime/src/sandbox.c
@ -454,6 +454,8 @@ sandbox_set_as_initialized(struct sandbox *sandbox, struct sandbox_request *sand
 	debuglog("Sandbox %lu | Uninitialized => Initialized\n", sandbox->request_arrival_timestamp);
 	sandbox->admissions_estimate = sandbox_request->admissions_estimate;
 	sandbox->request_arrival_timestamp   = sandbox_request->request_arrival_timestamp;
 	sandbox->allocation_timestamp        = allocation_timestamp;
 	sandbox->last_state_change_timestamp = allocation_timestamp;
@ -731,6 +733,11 @@ sandbox_set_as_error(struct sandbox *sandbox, sandbox_state_t last_state)
 	sandbox_print_perf(sandbox);
 	runtime_admitted -= sandbox->admissions_estimate;
 	assert(runtime_admitted >= 0);
 	debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
 	/* Do not touch sandbox state after adding to the completion queue to avoid use-after-free bugs */
 	local_completion_queue_add(sandbox);
 }
@ -768,6 +775,17 @@ sandbox_set_as_complete(struct sandbox *sandbox, sandbox_state_t last_state)
 	sandbox->last_state_change_timestamp = now;
 	sandbox->state                       = SANDBOX_COMPLETE;
 	/*
 	 * TODO: Enhance to include "spinning" or better "local|global scheduling latency" as well.
 	 * Given the async I/O model of libuv, it is ambiguous how to model "spinning"
 	 */
 	perf_window_add(&sandbox->module->perf_window, sandbox->running_duration);
 	runtime_admitted -= sandbox->admissions_estimate;
 	assert(runtime_admitted >= 0);
 	debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
 	sandbox_print_perf(sandbox);
 	/* Do not touch sandbox state after adding to the completion queue to avoid use-after-free bugs */