feat: Initial MVP of admissions control

4 years ago · 76ba308c16
parent abfb9b18e4
commit 76ba308c16
5 changed files with 81 additions and 3 deletions
--- a/runtime/include/runtime.h
+++ b/runtime/include/runtime.h
@ -29,6 +29,18 @@ extern float runtime_processor_speed_MHz;
 extern pthread_t runtime_worker_threads[];
 extern uint32_t  runtime_worker_threads_count;

+/*
+ * Unitless estimate of the instantaneous fraction of system capacity required to complete all previously
+ * admitted work. This is used to calculate free capacity as part of admissions control
+ *
+ * The estimated requirement of a single admitted request is calculated as
+ * estimated execution time (cycles) / relative deadline (cycles)
+ *
+ * This total is increased by a request's estimate on request acceptance and decreased by that same
+ * estimate on request completion (either success or failure)
+ */
+extern double runtime_admitted;
+
 void         alloc_linear_memory(void);
 void         expand_memory(void);
 INLINE char *get_function_from_table(uint32_t idx, uint32_t type_id);
--- a/runtime/include/sandbox.h
+++ b/runtime/include/sandbox.h
@ -81,6 +81,12 @@ struct sandbox {
 	uint64_t absolute_deadline;
 	uint64_t total_time; /* From Request to Response */

+	/*
+	 * Unitless estimate of the instantaneous fraction of system capacity required to run the request.
+	 * Calculated as estimated execution time (cycles) / relative deadline (cycles)
+	 */
+	double admissions_estimate;
+
 	struct module *module; /* the module this is an instance of */

 	int32_t arguments_offset; /* actual placement of arguments in the sandbox. */
--- a/runtime/include/sandbox_request.h
+++ b/runtime/include/sandbox_request.h
@ -14,6 +14,12 @@ struct sandbox_request {
 	struct sockaddr *socket_address;
 	uint64_t         request_arrival_timestamp; /* cycles */
 	uint64_t         absolute_deadline;         /* cycles */
+
+	/*
+	 * Unitless estimate of the instantaneous fraction of system capacity required to run the request.
+	 * Calculated as estimated execution time (cycles) / relative deadline (cycles)
+	 */
+	double admissions_estimate;
 };

 DEQUE_PROTOTYPE(sandbox, struct sandbox_request *);
@ -29,7 +35,8 @@ DEQUE_PROTOTYPE(sandbox, struct sandbox_request *);
 */
 static inline struct sandbox_request *
 sandbox_request_allocate(struct module *module, char *arguments, int socket_descriptor,
-                         const struct sockaddr *socket_address, uint64_t request_arrival_timestamp)
+                         const struct sockaddr *socket_address, uint64_t request_arrival_timestamp,
+                         double admissions_estimate)
 {
 	struct sandbox_request *sandbox_request = (struct sandbox_request *)malloc(sizeof(struct sandbox_request));
 	assert(sandbox_request);
@ -39,6 +46,7 @@ sandbox_request_allocate(struct module *module, char *arguments, int socket_desc
 	sandbox_request->socket_address            = (struct sockaddr *)socket_address;
 	sandbox_request->request_arrival_timestamp = request_arrival_timestamp;
 	sandbox_request->absolute_deadline         = request_arrival_timestamp + module->relative_deadline;
+	sandbox_request->admissions_estimate       = admissions_estimate;

 	debuglog("Allocating %lu of %s:%d\n", sandbox_request->request_arrival_timestamp, sandbox_request->module->name,
 	         sandbox_request->module->port);
--- a/runtime/src/runtime.c
+++ b/runtime/src/runtime.c
@ -16,7 +16,8 @@
 * Shared Process State    *
 **************************/

-int runtime_epoll_file_descriptor;
+int    runtime_epoll_file_descriptor;
+double runtime_admitted;

 /******************************************
 * Shared Process / Listener Thread Logic *
@ -44,6 +45,8 @@ runtime_initialize(void)

 	/* Initialize http_parser_settings global */
 	http_parser_settings_initialize();
+
+	runtime_admitted = 0;
 }

 /*************************
@ -92,14 +95,45 @@ listener_thread_main(void *dummy)
 			}
 			total_requests++;

+			/* Perform Admission Control */
+
+			/*
+			 * TODO: Enhance to use configurable percentiles rather than just mean. This can be policy
+			 * defined in the module specification
+			 */
+			uint64_t estimated_execution = perf_window_get_mean(&module->perf_window);
+
+			/*
+			 * If this is the first execution, assume a default estimated execution time
+			 * TODO: Enhance module specification to provide "seed" value of estimated duration
+			 * TODO: Should we "rate limit" or only admit one request before we have actual data? Otherwise
+			 * we might be flooded with sandboxes whose execution time is possibly underestimated
+			 */
+			if (estimated_execution == -1) estimated_execution = 1000;
+
+			double admissions_estimate = (double)estimated_execution / module->relative_deadline;
+
+			/*
+			 * Detect requests that would exceed system capacity (currently only logged, not rejected)
+			 * TODO: Enhance to reject by gracefully returning HTTP status code 503 Service Unavailable
+			 */
+			if (runtime_admitted + admissions_estimate >= runtime_worker_threads_count) {
+				debuglog("Would have rejected!");
+			}
+
 			/* Allocate a Sandbox Request */
 			struct sandbox_request *sandbox_request =
 			  sandbox_request_allocate(module, module->name, socket_descriptor,
-			                           (const struct sockaddr *)&client_address, request_arrival_timestamp);
+			                           (const struct sockaddr *)&client_address, request_arrival_timestamp,
+			                           admissions_estimate);
 			assert(sandbox_request);

 			/* Add to the Global Sandbox Request Scheduler */
 			global_request_scheduler_add(sandbox_request);
+
+			/* Add to work accepted by the runtime */
+			runtime_admitted += admissions_estimate;
+			debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
 		}
 	}

--- a/runtime/src/sandbox.c
+++ b/runtime/src/sandbox.c
@ -454,6 +454,8 @@ sandbox_set_as_initialized(struct sandbox *sandbox, struct sandbox_request *sand

 	debuglog("Sandbox %lu | Uninitialized => Initialized\n", sandbox->request_arrival_timestamp);

+	sandbox->admissions_estimate = sandbox_request->admissions_estimate;
+
 	sandbox->request_arrival_timestamp   = sandbox_request->request_arrival_timestamp;
 	sandbox->allocation_timestamp        = allocation_timestamp;
 	sandbox->last_state_change_timestamp = allocation_timestamp;
@ -731,6 +733,11 @@ sandbox_set_as_error(struct sandbox *sandbox, sandbox_state_t last_state)

 	sandbox_print_perf(sandbox);

+	runtime_admitted -= sandbox->admissions_estimate;
+	assert(runtime_admitted >= 0);
+
+	debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
+
 	/* Do not touch sandbox state after adding to the completion queue to avoid use-after-free bugs */
 	local_completion_queue_add(sandbox);
 }
@ -768,6 +775,17 @@ sandbox_set_as_complete(struct sandbox *sandbox, sandbox_state_t last_state)
 	sandbox->last_state_change_timestamp = now;
 	sandbox->state                       = SANDBOX_COMPLETE;

+	/*
+	 * TODO: Enhance to include "spinning" or better "local|global scheduling latency" as well.
+	 * Given the async I/O model of libuv, it is ambiguous how to model "spinning"
+	 */
+	perf_window_add(&sandbox->module->perf_window, sandbox->running_duration);
+
+	runtime_admitted -= sandbox->admissions_estimate;
+	assert(runtime_admitted >= 0);
+
+	debuglog("Runtime Utilization: %f%%\n", runtime_admitted / runtime_worker_threads_count * 100);
+
 	sandbox_print_perf(sandbox);

 	/* Do not touch sandbox state after adding to the completion queue to avoid use-after-free bugs */