Disable aux stack allocations for threads spawned by wasi_thread_start (#1867)

This syscall doesn't need allocating stack or TLS and it's expected from the application
to do that instead. E.g. WASI-libc already does this for `pthread_create`.

Also fix some of the examples to allocate memory for stack and not use stack before
the stack pointer is set to a correct value.
This commit is contained in:
Marcin Kolny 2023-01-09 12:36:34 +00:00 committed by GitHub
parent 2615646c20
commit 0e2382a959
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
12 changed files with 163 additions and 56 deletions

View File

@ -179,6 +179,13 @@ wasm_exec_env_create(struct WASMModuleInstanceCommon *module_inst,
void void
wasm_exec_env_destroy(WASMExecEnv *exec_env); wasm_exec_env_destroy(WASMExecEnv *exec_env);
static inline bool
wasm_exec_env_is_aux_stack_managed_by_runtime(WASMExecEnv *exec_env)
{
return exec_env->aux_stack_boundary.boundary != 0
|| exec_env->aux_stack_bottom.bottom != 0;
}
/** /**
* Allocate a WASM frame from the WASM stack. * Allocate a WASM frame from the WASM stack.
* *

View File

@ -1783,14 +1783,18 @@ wasm_interp_call_func_bytecode(WASMModuleInstance *module,
global = globals + global_idx; global = globals + global_idx;
global_addr = get_global_addr(global_data, global); global_addr = get_global_addr(global_data, global);
aux_stack_top = *(uint32 *)(frame_sp - 1); aux_stack_top = *(uint32 *)(frame_sp - 1);
if (aux_stack_top <= exec_env->aux_stack_boundary.boundary) { if (wasm_exec_env_is_aux_stack_managed_by_runtime(exec_env)) {
wasm_set_exception(module, "wasm auxiliary stack overflow"); if (aux_stack_top
goto got_exception; <= exec_env->aux_stack_boundary.boundary) {
} wasm_set_exception(module,
if (aux_stack_top > exec_env->aux_stack_bottom.bottom) { "wasm auxiliary stack overflow");
wasm_set_exception(module, goto got_exception;
"wasm auxiliary stack underflow"); }
goto got_exception; if (aux_stack_top > exec_env->aux_stack_bottom.bottom) {
wasm_set_exception(module,
"wasm auxiliary stack underflow");
goto got_exception;
}
} }
*(int32 *)global_addr = aux_stack_top; *(int32 *)global_addr = aux_stack_top;
frame_sp--; frame_sp--;

View File

@ -1576,14 +1576,18 @@ wasm_interp_call_func_bytecode(WASMModuleInstance *module,
global = globals + global_idx; global = globals + global_idx;
global_addr = get_global_addr(global_data, global); global_addr = get_global_addr(global_data, global);
aux_stack_top = frame_lp[GET_OFFSET()]; aux_stack_top = frame_lp[GET_OFFSET()];
if (aux_stack_top <= exec_env->aux_stack_boundary.boundary) { if (wasm_exec_env_is_aux_stack_managed_by_runtime(exec_env)) {
wasm_set_exception(module, "wasm auxiliary stack overflow"); if (aux_stack_top
goto got_exception; <= exec_env->aux_stack_boundary.boundary) {
} wasm_set_exception(module,
if (aux_stack_top > exec_env->aux_stack_bottom.bottom) { "wasm auxiliary stack overflow");
wasm_set_exception(module, goto got_exception;
"wasm auxiliary stack underflow"); }
goto got_exception; if (aux_stack_top > exec_env->aux_stack_bottom.bottom) {
wasm_set_exception(module,
"wasm auxiliary stack underflow");
goto got_exception;
}
} }
*(int32 *)global_addr = aux_stack_top; *(int32 *)global_addr = aux_stack_top;
#if WASM_ENABLE_MEMORY_PROFILING != 0 #if WASM_ENABLE_MEMORY_PROFILING != 0

View File

@ -619,8 +619,9 @@ pthread_create_wrapper(wasm_exec_env_t exec_env,
routine_args->module_inst = new_module_inst; routine_args->module_inst = new_module_inst;
os_mutex_lock(&exec_env->wait_lock); os_mutex_lock(&exec_env->wait_lock);
ret = wasm_cluster_create_thread( ret =
exec_env, new_module_inst, pthread_start_routine, (void *)routine_args); wasm_cluster_create_thread(exec_env, new_module_inst, true,
pthread_start_routine, (void *)routine_args);
if (ret != 0) { if (ret != 0) {
os_mutex_unlock(&exec_env->wait_lock); os_mutex_unlock(&exec_env->wait_lock);
goto fail; goto fail;

View File

@ -126,8 +126,8 @@ thread_spawn_wrapper(wasm_exec_env_t exec_env, uint32 start_arg)
thread_start_arg->start_func = start_func; thread_start_arg->start_func = start_func;
os_mutex_lock(&exec_env->wait_lock); os_mutex_lock(&exec_env->wait_lock);
ret = wasm_cluster_create_thread(exec_env, new_module_inst, thread_start, ret = wasm_cluster_create_thread(exec_env, new_module_inst, false,
thread_start_arg); thread_start, thread_start_arg);
if (ret != 0) { if (ret != 0) {
LOG_ERROR("Failed to spawn a new thread"); LOG_ERROR("Failed to spawn a new thread");
goto thread_spawn_fail; goto thread_spawn_fail;

View File

@ -125,6 +125,10 @@ free_aux_stack(WASMExecEnv *exec_env, uint32 start)
WASMModuleInstanceCommon *module_inst = WASMModuleInstanceCommon *module_inst =
wasm_exec_env_get_module_inst(exec_env); wasm_exec_env_get_module_inst(exec_env);
if (!wasm_exec_env_is_aux_stack_managed_by_runtime(exec_env)) {
return true;
}
bh_assert(start >= cluster->stack_size); bh_assert(start >= cluster->stack_size);
wasm_runtime_module_free(module_inst, start - cluster->stack_size); wasm_runtime_module_free(module_inst, start - cluster->stack_size);
@ -534,7 +538,7 @@ thread_manager_start_routine(void *arg)
int32 int32
wasm_cluster_create_thread(WASMExecEnv *exec_env, wasm_cluster_create_thread(WASMExecEnv *exec_env,
wasm_module_inst_t module_inst, wasm_module_inst_t module_inst, bool alloc_aux_stack,
void *(*thread_routine)(void *), void *arg) void *(*thread_routine)(void *), void *arg)
{ {
WASMCluster *cluster; WASMCluster *cluster;
@ -550,16 +554,18 @@ wasm_cluster_create_thread(WASMExecEnv *exec_env,
if (!new_exec_env) if (!new_exec_env)
return -1; return -1;
if (!allocate_aux_stack(exec_env, &aux_stack_start, &aux_stack_size)) { if (alloc_aux_stack) {
LOG_ERROR("thread manager error: " if (!allocate_aux_stack(exec_env, &aux_stack_start, &aux_stack_size)) {
"failed to allocate aux stack space for new thread"); LOG_ERROR("thread manager error: "
goto fail1; "failed to allocate aux stack space for new thread");
} goto fail1;
}
/* Set aux stack for current thread */ /* Set aux stack for current thread */
if (!wasm_exec_env_set_aux_stack(new_exec_env, aux_stack_start, if (!wasm_exec_env_set_aux_stack(new_exec_env, aux_stack_start,
aux_stack_size)) { aux_stack_size)) {
goto fail2; goto fail2;
}
} }
if (!wasm_cluster_add_exec_env(cluster, new_exec_env)) if (!wasm_cluster_add_exec_env(cluster, new_exec_env))
@ -581,7 +587,8 @@ fail3:
wasm_cluster_del_exec_env(cluster, new_exec_env); wasm_cluster_del_exec_env(cluster, new_exec_env);
fail2: fail2:
/* free the allocated aux stack space */ /* free the allocated aux stack space */
free_aux_stack(exec_env, aux_stack_start); if (alloc_aux_stack)
free_aux_stack(exec_env, aux_stack_start);
fail1: fail1:
wasm_exec_env_destroy(new_exec_env); wasm_exec_env_destroy(new_exec_env);
return -1; return -1;

View File

@ -64,7 +64,7 @@ wasm_exec_env_get_cluster(WASMExecEnv *exec_env);
int32 int32
wasm_cluster_create_thread(WASMExecEnv *exec_env, wasm_cluster_create_thread(WASMExecEnv *exec_env,
wasm_module_inst_t module_inst, wasm_module_inst_t module_inst, bool alloc_aux_stack,
void *(*thread_routine)(void *), void *arg); void *(*thread_routine)(void *), void *arg);
int32 int32

View File

@ -13,12 +13,13 @@ endif ()
set (CMAKE_SYSROOT "${WASI_SYSROOT}") set (CMAKE_SYSROOT "${WASI_SYSROOT}")
set (CMAKE_C_COMPILER "${WASI_SDK_DIR}/bin/clang") set (CMAKE_C_COMPILER "${WASI_SDK_DIR}/bin/clang")
set (CMAKE_ASM_COMPILER "${WASI_SDK_DIR}/bin/clang")
set (CMAKE_C_COMPILER_TARGET "wasm32-wasi") set (CMAKE_C_COMPILER_TARGET "wasm32-wasi")
function (compile_sample SOURCE_FILE) function (compile_sample SOURCE_FILE)
get_filename_component (FILE_NAME ${SOURCE_FILE} NAME_WLE) get_filename_component (FILE_NAME ${SOURCE_FILE} NAME_WLE)
set (WASM_MODULE ${FILE_NAME}.wasm) set (WASM_MODULE ${FILE_NAME}.wasm)
add_executable (${WASM_MODULE} ${SOURCE_FILE}) add_executable (${WASM_MODULE} ${SOURCE_FILE} ${ARGN})
target_compile_options (${WASM_MODULE} PRIVATE target_compile_options (${WASM_MODULE} PRIVATE
-pthread -ftls-model=local-exec) -pthread -ftls-model=local-exec)
@ -34,5 +35,5 @@ function (compile_sample SOURCE_FILE)
) )
endfunction () endfunction ()
compile_sample(no_pthread.c) compile_sample(no_pthread.c wasi_thread_start.S)
compile_sample(exception_propagation.c) compile_sample(exception_propagation.c wasi_thread_start.S)

View File

@ -9,15 +9,21 @@
#include <stdlib.h> #include <stdlib.h>
#include <stdio.h> #include <stdio.h>
#include <assert.h> #include <assert.h>
#include <wasi/api.h>
#include <semaphore.h> #include <semaphore.h>
#include <stdbool.h> #include <stdbool.h>
#include <unistd.h> #include <unistd.h>
#include "wasi_thread_start.h"
#define TIMEOUT_SECONDS 10 #define TIMEOUT_SECONDS 10
#define NUM_THREADS 3 #define NUM_THREADS 3
static sem_t sem; static sem_t sem;
typedef struct {
start_args_t base;
bool throw_exception;
} shared_t;
void void
run_long_task() run_long_task()
{ {
@ -26,12 +32,12 @@ run_long_task()
sleep(1); sleep(1);
} }
__attribute__((export_name("wasi_thread_start"))) void void
wasi_thread_start(int thread_id, int *start_arg) __wasi_thread_start_C(int thread_id, int *start_arg)
{ {
bool has_to_throw_exception = (bool)start_arg; shared_t *data = (shared_t *)start_arg;
if (has_to_throw_exception) { if (data->throw_exception) {
// Wait for all other threads (including main thread) to be ready // Wait for all other threads (including main thread) to be ready
printf("Waiting before throwing exception\n"); printf("Waiting before throwing exception\n");
for (int i = 0; i < NUM_THREADS; i++) for (int i = 0; i < NUM_THREADS; i++)
@ -52,26 +58,36 @@ wasi_thread_start(int thread_id, int *start_arg)
int int
main(int argc, char **argv) main(int argc, char **argv)
{ {
int thread_id = -1; int thread_id = -1, i;
shared_t data[NUM_THREADS] = { 0 };
if (sem_init(&sem, 0, 0) != 0) { if (sem_init(&sem, 0, 0) != 0) {
printf("Failed to init semaphore\n"); printf("Failed to init semaphore\n");
return EXIT_FAILURE; return EXIT_FAILURE;
} }
// Create a thread that throws an exception for (i = 0; i < NUM_THREADS; i++) {
thread_id = __wasi_thread_spawn((void *)true); // No graceful memory free to simplify the example
if (thread_id < 0) { if (!start_args_init(&data[i].base)) {
printf("Failed to create thread: %d\n", thread_id); printf("Failed to allocate thread's stack\n");
return EXIT_FAILURE; return EXIT_FAILURE;
}
} }
// Create two additional threads to test exception propagation // Create a thread that throws an exception
thread_id = __wasi_thread_spawn((void *)false); data[0].throw_exception = true;
thread_id = __wasi_thread_spawn(&data[0]);
if (thread_id < 0) { if (thread_id < 0) {
printf("Failed to create thread: %d\n", thread_id); printf("Failed to create thread: %d\n", thread_id);
return EXIT_FAILURE; return EXIT_FAILURE;
} }
thread_id = __wasi_thread_spawn((void *)false); // Create two additional threads to test exception propagation
thread_id = __wasi_thread_spawn(&data[1]);
if (thread_id < 0) {
printf("Failed to create thread: %d\n", thread_id);
return EXIT_FAILURE;
}
thread_id = __wasi_thread_spawn(&data[2]);
if (thread_id < 0) { if (thread_id < 0) {
printf("Failed to create thread: %d\n", thread_id); printf("Failed to create thread: %d\n", thread_id);
return EXIT_FAILURE; return EXIT_FAILURE;

View File

@ -9,18 +9,20 @@
#include <stdlib.h> #include <stdlib.h>
#include <stdio.h> #include <stdio.h>
#include <assert.h> #include <assert.h>
#include <wasi/api.h>
#include "wasi_thread_start.h"
static const int64_t SECOND = 1000 * 1000 * 1000; static const int64_t SECOND = 1000 * 1000 * 1000;
typedef struct { typedef struct {
start_args_t base;
int th_ready; int th_ready;
int value; int value;
int thread_id; int thread_id;
} shared_t; } shared_t;
__attribute__((export_name("wasi_thread_start"))) void void
wasi_thread_start(int thread_id, int *start_arg) __wasi_thread_start_C(int thread_id, int *start_arg)
{ {
shared_t *data = (shared_t *)start_arg; shared_t *data = (shared_t *)start_arg;
@ -38,18 +40,26 @@ wasi_thread_start(int thread_id, int *start_arg)
int int
main(int argc, char **argv) main(int argc, char **argv)
{ {
shared_t data = { 0, 52, -1 }; shared_t data = { { NULL }, 0, 52, -1 };
int thread_id; int thread_id;
int ret = EXIT_SUCCESS;
if (!start_args_init(&data.base)) {
printf("Stack allocation for thread failed\n");
return EXIT_FAILURE;
}
thread_id = __wasi_thread_spawn(&data); thread_id = __wasi_thread_spawn(&data);
if (thread_id < 0) { if (thread_id < 0) {
printf("Failed to create thread: %d\n", thread_id); printf("Failed to create thread: %d\n", thread_id);
return EXIT_FAILURE; ret = EXIT_FAILURE;
goto final;
} }
if (__builtin_wasm_memory_atomic_wait32(&data.th_ready, 0, SECOND) == 2) { if (__builtin_wasm_memory_atomic_wait32(&data.th_ready, 0, SECOND) == 2) {
printf("Timeout\n"); printf("Timeout\n");
return EXIT_FAILURE; ret = EXIT_FAILURE;
goto final;
} }
printf("Thread completed, new value: %d, thread id: %d\n", data.value, printf("Thread completed, new value: %d, thread id: %d\n", data.value,
@ -57,5 +67,8 @@ main(int argc, char **argv)
assert(thread_id == data.thread_id); assert(thread_id == data.thread_id);
return EXIT_SUCCESS; final:
start_args_deinit(&data.base);
return ret;
} }

View File

@ -0,0 +1,22 @@
# A slightly modified copy of the wasi-libc implementation
# https://github.com/WebAssembly/wasi-libc/pull/376/
.globaltype __stack_pointer, i32
.functype __wasi_thread_start_C (i32, i32) -> ()
.globl wasi_thread_start
wasi_thread_start:
.functype wasi_thread_start (i32, i32) -> ()
# Set up the minimum C environment.
# Note: offsetof(start_arg, stack) == 0
local.get 1 # start_arg
i32.load 0 # stack
global.set __stack_pointer
# Make the C function do the rest of work.
local.get 0 # tid
local.get 1 # start_arg
call __wasi_thread_start_C
end_function

View File

@ -0,0 +1,32 @@
/*
* Copyright (C) 2022 Amazon.com Inc. or its affiliates. All rights reserved.
* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
*/
#ifndef WASI_THREAD_START_H
#define WASI_THREAD_START_H
#define STACK_SIZE 1024
typedef struct {
void *stack;
} start_args_t;
static inline int
start_args_init(start_args_t *start_args)
{
start_args->stack = malloc(STACK_SIZE);
if (!start_args->stack) {
return 0;
}
start_args->stack += STACK_SIZE;
return 1;
}
static inline void
start_args_deinit(start_args_t *start_args)
{
free(start_args->stack - STACK_SIZE);
}
#endif