/* Copyright (C) 2012 Monty Program Ab This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; version 2 of the License. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ #ifdef _WIN32_WINNT #undef _WIN32_WINNT #endif #define _WIN32_WINNT 0x0601 #include #include #include #include #include #include #include #include #include #include #include /* WEAK_SYMBOL(return_type, function_name, argument_type1,..,argument_typeN) Declare and load function pointer from kernel32. The name of the static variable that holds the function pointer is my_ This should be combined with #define my_ so that one could use Widows APIs transparently, without worrying whether they are present in a particular version or not. Of course, prior to use of any function there should be a check for correct Windows version, or check whether function pointer is not NULL. */ #define WEAK_SYMBOL(return_type, function, ...) \ typedef return_type (WINAPI *pFN_##function)(__VA_ARGS__); \ static pFN_##function my_##function = (pFN_##function) \ (GetProcAddress(GetModuleHandle("kernel32"),#function)) WEAK_SYMBOL(BOOL, SetThreadpoolStackInformation, PTP_POOL, PTP_POOL_STACK_INFORMATION); #define SetThreadpoolStackInformation my_SetThreadpoolStackInformation /* Log a warning */ static void tp_log_warning(const char *msg, const char *fct) { sql_print_warning("Threadpool: %s. %s failed (last error %d)",msg, fct, GetLastError()); } PTP_POOL pool; DWORD fls; static bool skip_completion_port_on_success = false; /* Threadpool callbacks. io_completion_callback - handle client request timer_callback - handle wait timeout (kill connection) shm_read_callback, shm_close_callback - shared memory stuff login_callback - user login (submitted as threadpool work) */ static void CALLBACK timer_callback(PTP_CALLBACK_INSTANCE instance, PVOID context, PTP_TIMER timer); static void CALLBACK io_completion_callback(PTP_CALLBACK_INSTANCE instance, PVOID context, PVOID overlapped, ULONG io_result, ULONG_PTR nbytes, PTP_IO io); static void CALLBACK shm_read_callback(PTP_CALLBACK_INSTANCE instance, PVOID Context, PTP_WAIT wait,TP_WAIT_RESULT wait_result); static void CALLBACK shm_close_callback(PTP_CALLBACK_INSTANCE instance, PVOID Context, PTP_WAIT wait,TP_WAIT_RESULT wait_result); static void check_thread_init(); /* Get current time as Windows time */ static ulonglong now() { ulonglong current_time; GetSystemTimeAsFileTime((PFILETIME)¤t_time); return current_time; } /* Connection structure, encapsulates THD + structures for asynchronous IO and pool. */ struct connection_t { THD *thd; HANDLE handle; OVERLAPPED overlapped; /* absolute time for wait timeout (as Windows time) */ volatile ulonglong timeout; TP_CALLBACK_ENVIRON callback_environ; PTP_IO io; PTP_TIMER timer; PTP_WAIT shm_read; /* Callback instance, used to inform treadpool about long callbacks */ PTP_CALLBACK_INSTANCE callback_instance; CONNECT* connect; bool logged_in; }; void init_connection(connection_t *connection, CONNECT *connect) { connection->logged_in = false; connection->handle= 0; connection->io= 0; connection->shm_read= 0; connection->timer= 0; connection->logged_in = false; connection->timeout= ULONGLONG_MAX; connection->callback_instance= 0; connection->thd= 0; memset(&connection->overlapped, 0, sizeof(OVERLAPPED)); InitializeThreadpoolEnvironment(&connection->callback_environ); SetThreadpoolCallbackPool(&connection->callback_environ, pool); connection->connect= connect; } int init_io(connection_t *connection, THD *thd) { connection->thd= thd; Vio *vio = thd->net.vio; switch(vio->type) { case VIO_TYPE_SSL: case VIO_TYPE_TCPIP: connection->handle= (HANDLE)mysql_socket_getfd(connection->thd->net.vio->mysql_socket); break; case VIO_TYPE_NAMEDPIPE: connection->handle= (HANDLE)vio->hPipe; break; case VIO_TYPE_SHARED_MEMORY: connection->shm_read= CreateThreadpoolWait(shm_read_callback, connection, &connection->callback_environ); if (!connection->shm_read) { tp_log_warning("Allocation failed", "CreateThreadpoolWait"); return -1; } break; default: abort(); } if (connection->handle) { /* Performance tweaks (s. MSDN documentation)*/ UCHAR flags= FILE_SKIP_SET_EVENT_ON_HANDLE; if (skip_completion_port_on_success) { flags |= FILE_SKIP_COMPLETION_PORT_ON_SUCCESS; } (void)SetFileCompletionNotificationModes(connection->handle, flags); /* Assign io completion callback */ connection->io= CreateThreadpoolIo(connection->handle, io_completion_callback, connection, &connection->callback_environ); if(!connection->io) { tp_log_warning("Allocation failed", "CreateThreadpoolWait"); return -1; } } connection->timer= CreateThreadpoolTimer(timer_callback, connection, &connection->callback_environ); if (!connection->timer) { tp_log_warning("Allocation failed", "CreateThreadpoolWait"); return -1; } return 0; } /* Start asynchronous read */ int start_io(connection_t *connection, PTP_CALLBACK_INSTANCE instance) { /* Start async read */ DWORD num_bytes = 0; static char c; WSABUF buf; buf.buf= &c; buf.len= 0; DWORD flags=0; DWORD last_error= 0; int retval; Vio *vio= connection->thd->net.vio; if (vio->type == VIO_TYPE_SHARED_MEMORY) { SetThreadpoolWait(connection->shm_read, vio->event_server_wrote, NULL); return 0; } if (vio->type == VIO_CLOSED) { return -1; } DBUG_ASSERT(vio->type == VIO_TYPE_TCPIP || vio->type == VIO_TYPE_SSL || vio->type == VIO_TYPE_NAMEDPIPE); OVERLAPPED *overlapped= &connection->overlapped; PTP_IO io= connection->io; StartThreadpoolIo(io); if (vio->type == VIO_TYPE_TCPIP || vio->type == VIO_TYPE_SSL) { /* Start async io (sockets). */ if (WSARecv(mysql_socket_getfd(vio->mysql_socket) , &buf, 1, &num_bytes, &flags, overlapped, NULL) == 0) { retval= last_error= 0; } else { retval= -1; last_error= WSAGetLastError(); } } else { /* Start async io (named pipe) */ if (ReadFile(vio->hPipe, &c, 0, &num_bytes ,overlapped)) { retval= last_error= 0; } else { retval= -1; last_error= GetLastError(); } } if (retval == 0 || last_error == ERROR_MORE_DATA) { /* IO successfully finished (synchronously). If skip_completion_port_on_success is set, we need to handle it right here, because completion callback would not be executed by the pool. */ if(skip_completion_port_on_success) { CancelThreadpoolIo(io); io_completion_callback(instance, connection, overlapped, last_error, num_bytes, io); } return 0; } if(last_error == ERROR_IO_PENDING) { return 0; } /* Some error occurred */ CancelThreadpoolIo(io); return -1; } int login(connection_t *connection, PTP_CALLBACK_INSTANCE instance) { if ((connection->thd= threadpool_add_connection(connection->connect, connection)) && init_io(connection, connection->thd) == 0 && start_io(connection, instance) == 0) { return 0; } return -1; } /* Recalculate wait timeout, maybe reset timer. */ void set_wait_timeout(connection_t *connection, ulonglong old_timeout) { ulonglong new_timeout = now() + 10000000LL*connection->thd->variables.net_wait_timeout; if (new_timeout < old_timeout) { SetThreadpoolTimer(connection->timer, (PFILETIME) &new_timeout, 0, 1000); } connection->timeout = new_timeout; } /* Connection destructor */ void destroy_connection(connection_t *connection, PTP_CALLBACK_INSTANCE instance) { if (instance) DisassociateCurrentThreadFromCallback(instance); if (connection->io) { WaitForThreadpoolIoCallbacks(connection->io, TRUE); CloseThreadpoolIo(connection->io); } if(connection->shm_read) { WaitForThreadpoolWaitCallbacks(connection->shm_read, TRUE); CloseThreadpoolWait(connection->shm_read); } if(connection->timer) { SetThreadpoolTimer(connection->timer, 0, 0, 0); WaitForThreadpoolTimerCallbacks(connection->timer, TRUE); CloseThreadpoolTimer(connection->timer); } if (connection->thd) { threadpool_remove_connection(connection->thd); } DestroyThreadpoolEnvironment(&connection->callback_environ); } /* This function should be called first whenever a callback is invoked in the threadpool, does my_thread_init() if not yet done */ extern ulong thread_created; static void check_thread_init() { if (FlsGetValue(fls) == NULL) { FlsSetValue(fls, (void *)1); statistic_increment(thread_created, &LOCK_status); InterlockedIncrement((volatile long *)&tp_stats.num_worker_threads); } } /* Decrement number of threads when a thread exits . On Windows, FlsAlloc() provides the thread destruction callbacks. */ static VOID WINAPI thread_destructor(void *data) { if(data) { InterlockedDecrement((volatile long *)&tp_stats.num_worker_threads); } } /* Scheduler callback : init */ bool tp_init(void) { fls= FlsAlloc(thread_destructor); pool= CreateThreadpool(NULL); if(!pool) { sql_print_error("Can't create threadpool. " "CreateThreadpool() failed with %d. Likely cause is memory pressure", GetLastError()); exit(1); } if (threadpool_max_threads) { SetThreadpoolThreadMaximum(pool,threadpool_max_threads); } if (threadpool_min_threads) { if (!SetThreadpoolThreadMinimum(pool, threadpool_min_threads)) { tp_log_warning( "Can't set threadpool minimum threads", "SetThreadpoolThreadMinimum"); } } /* Control stack size (OS must be Win7 or later, plus corresponding SDK) */ #if _MSC_VER >=1600 if (SetThreadpoolStackInformation) { TP_POOL_STACK_INFORMATION stackinfo; stackinfo.StackCommit = 0; stackinfo.StackReserve = (SIZE_T)my_thread_stack_size; if (!SetThreadpoolStackInformation(pool, &stackinfo)) { tp_log_warning("Can't set threadpool stack size", "SetThreadpoolStackInformation"); } } #endif return 0; } /** Scheduler callback : Destroy the scheduler. */ void tp_end(void) { if(pool) { SetThreadpoolThreadMaximum(pool, 0); CloseThreadpool(pool); } } /* Handle read completion/notification. */ static VOID CALLBACK io_completion_callback(PTP_CALLBACK_INSTANCE instance, PVOID context, PVOID overlapped, ULONG io_result, ULONG_PTR nbytes, PTP_IO io) { if(instance) { check_thread_init(); } connection_t *connection = (connection_t*)context; if (io_result != ERROR_SUCCESS) goto error; THD *thd= connection->thd; ulonglong old_timeout = connection->timeout; connection->timeout = ULONGLONG_MAX; connection->callback_instance= instance; if (threadpool_process_request(connection->thd)) goto error; set_wait_timeout(connection, old_timeout); if(start_io(connection, instance)) goto error; return; error: /* Some error has occurred. */ destroy_connection(connection, instance); free(connection); } /* Simple callback for login */ static void CALLBACK login_callback(PTP_CALLBACK_INSTANCE instance, PVOID context, PTP_WORK work) { if(instance) { check_thread_init(); } connection_t *connection =(connection_t *)context; if (login(connection, instance) != 0) { destroy_connection(connection, instance); free(connection); } } /* Timer callback. Invoked when connection times out (wait_timeout) */ static VOID CALLBACK timer_callback(PTP_CALLBACK_INSTANCE instance, PVOID parameter, PTP_TIMER timer) { check_thread_init(); connection_t *con= (connection_t*)parameter; ulonglong timeout= con->timeout; if (timeout <= now()) { con->thd->killed = KILL_CONNECTION; if(con->thd->net.vio) vio_shutdown(con->thd->net.vio, SD_BOTH); } else if(timeout != ULONGLONG_MAX) { /* Reset timer. There is a tiny possibility of a race condition, since the value of timeout could have changed to smaller value in the thread doing io callback. Given the relative unimportance of the wait timeout, we accept race condition. */ SetThreadpoolTimer(timer, (PFILETIME)&timeout, 0, 1000); } } /* Shared memory read callback. Invoked when read event is set on connection. */ static void CALLBACK shm_read_callback(PTP_CALLBACK_INSTANCE instance, PVOID context, PTP_WAIT wait,TP_WAIT_RESULT wait_result) { connection_t *con= (connection_t *)context; /* Disarm wait. */ SetThreadpoolWait(wait, NULL, NULL); /* This is an autoreset event, and one wakeup is eaten already by threadpool, and the current state is "not set". Thus we need to reset the event again, or vio_read will hang. */ HANDLE h = con->thd->net.vio->event_server_wrote; SetEvent(h); io_completion_callback(instance, context, NULL, 0, 0 , 0); } /* Notify the thread pool about a new connection. */ void tp_add_connection(CONNECT *connect) { connection_t *con; con= (connection_t *)malloc(sizeof(connection_t)); DBUG_EXECUTE_IF("simulate_failed_connection_1", free(con);con= 0; ); if (!con) { tp_log_warning("Allocation failed", "tp_add_connection"); connect->close_and_delete(); return; } init_connection(con, connect); /* Try to login asynchronously, using threads in the pool */ PTP_WORK wrk = CreateThreadpoolWork(login_callback,con, &con->callback_environ); if (wrk) { SubmitThreadpoolWork(wrk); CloseThreadpoolWork(wrk); } else { /* Likely memory pressure */ connect->close_and_delete(); } } /** Sets the number of idle threads the thread pool maintains in anticipation of new requests. */ void tp_set_min_threads(uint val) { if (pool) SetThreadpoolThreadMinimum(pool, val); } void tp_set_max_threads(uint val) { if (pool) SetThreadpoolThreadMaximum(pool, val); } void tp_wait_begin(THD *thd, int type) { DBUG_ASSERT(thd); /* Signal to the threadpool whenever callback can run long. Currently, binlog waits are a good candidate, its waits are really long */ if (type == THD_WAIT_BINLOG) { connection_t *connection= (connection_t *)thd->event_scheduler.data; if(connection && connection->callback_instance) { CallbackMayRunLong(connection->callback_instance); /* Reset instance, to avoid calling CallbackMayRunLong twice within the same callback (it is an error according to docs). */ connection->callback_instance= 0; } } } void tp_wait_end(THD *thd) { /* Do we need to do anything ? */ } /** Number of idle threads in pool. This info is not available in Windows implementation, thus function always returns 0. */ int tp_get_idle_thread_count() { return 0; }