swiftlang
diff --git a/‎configure.ac
Lines changed: 32 additions & 12 deletions b/‎configure.ac
Lines changed: 32 additions & 12 deletions
diff --git a/‎src/Makefile.am
Lines changed: 10 additions & 1 deletion b/‎src/Makefile.am
Lines changed: 10 additions & 1 deletion
diff --git a/‎src/event/workqueue.c
Lines changed: 287 additions & 0 deletions b/‎src/event/workqueue.c
Lines changed: 287 additions & 0 deletions
@@ -320,21 +320,41 @@ AS_IF([test -n "$apple_libpthread_source_path" -a -n "$apple_xnu_source_osfmk_pa
 AC_CHECK_HEADERS([pthread_machdep.h pthread/qos.h])
 
 # pthread_workqueues.
-# Look for own version first, then system version.
-AS_IF([test -f $srcdir/libpwq/configure.ac],
-  [AC_DEFINE(BUILD_OWN_PTHREAD_WORKQUEUES, 1, [Define if building pthread work queues from source])
-   ac_configure_args="--disable-libpwq-install $ac_configure_args"
-   AC_CONFIG_SUBDIRS([libpwq])
-   build_own_pthread_workqueues=true
+# Use libdispatch's internal implementation if enabled; otherwise look for libpwq in our source tree, and finally fall back to the system version.
+# When neither --enable-internal-libpwq nor --disable-internal-libpwq is given,
+# default to yes on Linux targets and to no everywhere else.
+AC_ARG_ENABLE([internal-libpwq],
+  [AS_HELP_STRING([--enable-internal-libpwq],
+    [Use libdispatch's own implementation of pthread workqueues.])],,
+  [AS_CASE([$target_os],
+     [linux*], [enable_internal_libpwq=yes],
+     [enable_internal_libpwq=no])]
+)
+AS_IF([test "x$enable_internal_libpwq" = "xyes"],
+  [AC_DEFINE(HAVE_INTERNAL_PTHREAD_WORKQUEUE, 1, [Use libdispatch's own implementation of pthread_workqueue API])
    AC_DEFINE(HAVE_PTHREAD_WORKQUEUES, 1, [Define if pthread work queues are present])
-   have_pthread_workqueues=true],
-  [build_own_pthread_workqueues=false
-   AC_CHECK_HEADERS([pthread/workqueue_private.h pthread_workqueue.h],
-     [AC_DEFINE(HAVE_PTHREAD_WORKQUEUES, 1, [Define if pthread work queues are present])
+   have_internal_pthread_workqueues=true
+   have_pthread_workqueues=true
+   build_own_pthread_workqueues=false],
+  [have_internal_pthread_workqueues=false
+   AS_IF([test -f $srcdir/libpwq/configure.ac],
+     [AC_DEFINE(BUILD_OWN_PTHREAD_WORKQUEUES, 1, [Define if building pthread work queues from source])
+      ac_configure_args="--disable-libpwq-install $ac_configure_args"
+      AC_CONFIG_SUBDIRS([libpwq])
+      build_own_pthread_workqueues=true
+      AC_DEFINE(HAVE_PTHREAD_WORKQUEUES, 1, [Define if pthread work queues are present])
       have_pthread_workqueues=true],
-     [have_pthread_workqueues=false]
-   )]
+     [build_own_pthread_workqueues=false
+      AC_CHECK_HEADERS([pthread/workqueue_private.h pthread_workqueue.h],
+        [AC_DEFINE(HAVE_PTHREAD_WORKQUEUES, 1, [Define if pthread work queues are present])
+         have_pthread_workqueues=true],
+        [have_pthread_workqueues=false]
+      )]
+  )]
 )
+AM_CONDITIONAL(HAVE_INTERNAL_PTHREAD_WORKQUEUES, $have_internal_pthread_workqueues)
 AM_CONDITIONAL(BUILD_OWN_PTHREAD_WORKQUEUES, $build_own_pthread_workqueues)
 AM_CONDITIONAL(HAVE_PTHREAD_WORKQUEUES, $have_pthread_workqueues)
 
 
@@ -9,6 +9,12 @@ else
 lib_LTLIBRARIES=libdispatch.la
 endif
 
+if HAVE_INTERNAL_PTHREAD_WORKQUEUES
+INTERNAL_WORKQUEUE_SOURCES= 	\
+	event/workqueue.c		\
+	event/workqueue_internal.h
+endif
+
 libdispatch_la_SOURCES=			\
 	allocator.c			\
 	apply.c				\
@@ -60,7 +66,8 @@ libdispatch_la_SOURCES=			\
 	shims/perfmon.h			\
 	shims/time.h			\
 	shims/tsd.h			\
-	shims/yield.h
+	shims/yield.h			\
+	$(INTERNAL_WORKQUEUE_SOURCES)
 
 EXTRA_libdispatch_la_SOURCES=
 EXTRA_libdispatch_la_DEPENDENCIES=
@@ -77,6 +84,7 @@ AM_OBJCFLAGS=$(DISPATCH_CFLAGS) $(CBLOCKS_FLAGS)
 AM_CXXFLAGS=$(PTHREAD_WORKQUEUE_CFLAGS) $(DISPATCH_CFLAGS) $(CXXBLOCKS_FLAGS)
 AM_OBJCXXFLAGS=$(DISPATCH_CFLAGS) $(CXXBLOCKS_FLAGS)
 
+if !HAVE_INTERNAL_PTHREAD_WORKQUEUES
 if BUILD_OWN_PTHREAD_WORKQUEUES
   PTHREAD_WORKQUEUE_LIBS=$(top_builddir)/libpwq/libpthread_workqueue.la
   PTHREAD_WORKQUEUE_CFLAGS=-I$(top_srcdir)/libpwq/include
@@ -85,6 +93,7 @@ if HAVE_PTHREAD_WORKQUEUES
   PTHREAD_WORKQUEUE_LIBS=-lpthread_workqueue
 endif
 endif
+endif
 
 if BUILD_OWN_BLOCKS_RUNTIME
 libdispatch_la_SOURCES+= BlocksRuntime/data.c BlocksRuntime/runtime.c
 
@@ -0,0 +1,287 @@
+/*
+ * Copyright (c) 2017-2017 Apple Inc. All rights reserved.
+ *
+ * @APPLE_APACHE_LICENSE_HEADER_START@
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ * @APPLE_APACHE_LICENSE_HEADER_END@
+ */
+
+#include "internal.h"
+
+#if HAVE_INTERNAL_PTHREAD_WORKQUEUE
+
+/*
+ * dispatch_workq monitors the thread pool that is
+ * executing the work enqueued on libdispatch's pthread
+ * root queues and dynamically adjusts its size.
+ *
+ * The dynamic monitoring can be implemented using either
+ *   (a) low-frequency user-level approximation of the number of runnable
+ *       worker threads via reading the /proc file system
+ *   (b) a Linux kernel extension that hooks the process change handler
+ *       to accurately track the number of runnable normal worker threads
+ * Using either form of monitoring, if (i) there appears to be
+ * work available in the monitored pthread root queue, (ii) the
+ * number of runnable workers is below the target size for the pool,
+ * and (iii) the total number of worker threads is below an upper limit,
+ * then an additional worker thread will be added to the pool.
+ */
+
+#pragma mark static data for management subsystem
+
+#if DISPATCH_ENABLE_PWQ_KEXT
+/* True when kext-based management is in use; false selects the user-level path. Assigned in _dispatch_workq_init_once(). */
+static bool _dispatch_workq_kext_active;
+#endif
+
+/*
+ * Bookkeeping used by the user-level monitor of a workqueue.
+ */
+struct dispatch_workq_manager_s {
+	/* Number of registered workers found runnable by the latest scan */
+	int32_t runnable_workers;
+
+	/* Number of runnable registered workers the monitor aims for */
+	int32_t target_runnable_workers;
+
+	/*
+	 * Table of registered workers. Every access must be made with
+	 * registered_worker_lock held.
+	 * Invariant: slots [0, num_registered_workers) hold the ids
+	 *   (as obtained from SYS_gettid) of the workers being managed.
+	 */
+	dispatch_unfair_lock_s registered_worker_lock;
+	pid_t *registered_workers;
+	int num_registered_workers;
+};
+typedef struct dispatch_workq_manager_s dispatch_workq_manager_s;
+typedef struct dispatch_workq_manager_s *dispatch_workq_manager_t;
+
+/* The single manager instance used by this file. */
+static dispatch_workq_manager_s _dispatch_workq_manager;
+
+#pragma mark inline helper functions
+
+/*
+ * Return a pointer to the file-scope manager instance.
+ * Declared with (void) so the definition is a real prototype and calls
+ * that pass arguments are rejected by the compiler.
+ */
+DISPATCH_INLINE
+dispatch_workq_manager_t
+_dispatch_workq_get_default_manager(void)
+{
+	return &_dispatch_workq_manager;
+}
+
+/*
+ * Return the root queue whose workers are monitored by this file:
+ * the DISPATCH_ROOT_QUEUE_IDX_DEFAULT_QOS entry of _dispatch_root_queues.
+ * Declared with (void) so the definition is a real prototype.
+ */
+DISPATCH_INLINE
+dispatch_queue_t
+_dispatch_workq_get_default_root_queue(void)
+{
+	return &_dispatch_root_queues[DISPATCH_ROOT_QUEUE_IDX_DEFAULT_QOS];
+}
+
+/*
+ * Report whether dq currently has a non-NULL dq_items_tail.
+ */
+DISPATCH_INLINE
+bool
+_dispatch_workq_root_queue_has_work(dispatch_queue_t dq)
+{
+	bool queue_is_empty = (dq->dq_items_tail == NULL);
+	return !queue_is_empty;
+}
+
+#pragma mark Implementation of the management subsystem.
+
+#define WORKQ_MAX_TRACKED_WORKERS DISPATCH_WORKQ_MAX_PTHREAD_COUNT /* capacity of the registered_workers table */
+#define WORKQ_OVERSUBSCRIBE_FACTOR 2 /* multiplier applied to target_runnable_workers to bound oversubscription */
+
+static void _dispatch_workq_init_once(void *context DISPATCH_UNUSED); /* defined below; invoked through dispatch_once_f */
+static dispatch_once_t _dispatch_workq_init_once_pred; /* once-predicate paired with _dispatch_workq_init_once */
+
+/*
+ * Begin tracking the calling thread as a worker of root_q.
+ *
+ * Only the default root queue is monitored: for any other queue the call
+ * returns false immediately. Otherwise the management subsystem is
+ * initialized on first use and the caller's thread id is appended to the
+ * manager's table.
+ *
+ * Returns true when the worker was recorded (or handed to the kext path),
+ * false when the queue is not tracked or no tracking slot is available.
+ */
+bool
+dispatch_workq_worker_register(dispatch_queue_t root_q)
+{
+	if (root_q != _dispatch_workq_get_default_root_queue()) {
+		// Not tracked.
+		return false;
+	}
+
+	dispatch_once_f(&_dispatch_workq_init_once_pred, NULL, &_dispatch_workq_init_once);
+
+#if DISPATCH_ENABLE_PWQ_KEXT
+	if (_dispatch_workq_kext_active) {
+		_dispatch_workq_worker_register_kext();
+		return true;
+	}
+#endif
+	dispatch_workq_manager_t manager = _dispatch_workq_get_default_manager();
+	int self_tid = syscall(SYS_gettid);
+	bool registered = false;
+
+	_dispatch_unfair_lock_lock(&manager->registered_worker_lock);
+	if (manager->num_registered_workers < WORKQ_MAX_TRACKED_WORKERS-1) {
+		// Append at the end of the occupied prefix of the table.
+		manager->registered_workers[manager->num_registered_workers] = self_tid;
+		manager->num_registered_workers++;
+		registered = true;
+	}
+	_dispatch_unfair_lock_unlock(&manager->registered_worker_lock);
+
+	return registered;
+}
+
+/*
+ * Stop tracking the calling thread as a worker of root_q.
+ *
+ * Only the default root queue is monitored; for any other queue this is a
+ * no-op. On the user-level path the caller's thread id is removed from the
+ * manager's table by moving the last entry into its slot, so the occupied
+ * prefix of the table stays dense. A thread id that is not in the table is
+ * silently ignored.
+ */
+void
+dispatch_workq_worker_unregister(dispatch_queue_t root_q)
+{
+	if (root_q != _dispatch_workq_get_default_root_queue()) {
+		// Not tracked.
+		return;
+	}
+
+#if DISPATCH_ENABLE_PWQ_KEXT
+	if (_dispatch_workq_kext_active) {
+		// This path previously called the *register* kext hook, which would
+		// register the exiting worker a second time instead of removing it.
+		// NOTE(review): the unregister hook name is assumed by symmetry with
+		// _dispatch_workq_worker_register_kext(); confirm against the kext shim.
+		_dispatch_workq_worker_unregister_kext();
+		return;
+	}
+#endif
+	dispatch_workq_manager_t mgr = _dispatch_workq_get_default_manager();
+	int tid = syscall(SYS_gettid);
+	_dispatch_unfair_lock_lock(&mgr->registered_worker_lock);
+	for (int i=0; i<mgr->num_registered_workers; i++) {
+		if (mgr->registered_workers[i] == tid) {
+			// Swap-remove: overwrite the slot with the last entry and shrink.
+			int last = mgr->num_registered_workers - 1;
+			mgr->registered_workers[i] = mgr->registered_workers[last];
+			mgr->registered_workers[last] = 0;
+			mgr->num_registered_workers--;
+			break;
+		}
+	}
+	_dispatch_unfair_lock_unlock(&mgr->registered_worker_lock);
+}
+
+
+/*
+ * For each registered worker id, read /proc/[id]/stat and count how many
+ * workers are in the runnable state ('R'). The count is stored in
+ * mgr->runnable_workers. The whole scan runs with registered_worker_lock held.
+ *
+ * A worker whose stat file cannot be opened is assumed to have exited
+ * without unregistering and is dropped from the table.
+ *
+ * See the proc(5) man page for the format of /proc/[pid]/stat: the second
+ * field (comm) is enclosed in parentheses and may itself contain spaces or
+ * parentheses, so the state field is located after the last ')'.
+ */
+static void
+_dispatch_workq_count_runnable_workers(dispatch_workq_manager_t mgr)
+{
+	char path[128];
+	char buf[4096];
+	int running_count = 0;
+
+	_dispatch_unfair_lock_lock(&mgr->registered_worker_lock);
+
+	int i = 0;
+	while (i < mgr->num_registered_workers) {
+		pid_t worker_pid = mgr->registered_workers[i];
+
+		int r = snprintf(path, sizeof(path), "/proc/%d/stat", worker_pid);
+		(void)dispatch_assume(r > 0 && (size_t)r < sizeof(path));
+
+		int fd = open(path, O_RDONLY | O_NONBLOCK);
+		if (unlikely(fd == -1)) {
+			// Unable to open file.
+			// Must mean worker exited uncleanly (without executing _dispatch_worker_unregister())
+			// Clean up by removing pid and decrementing number of registered workers
+			_dispatch_debug("workq: Unable to open /proc/%d/stat; removing worker from monitoring list", worker_pid);
+			int last = mgr->num_registered_workers-1;
+			mgr->registered_workers[i] = mgr->registered_workers[last];
+			mgr->registered_workers[last] = 0;
+			mgr->num_registered_workers--;
+			// Do not advance i: slot i now holds the entry that used to be
+			// last, and it has not been examined yet.
+			continue;
+		}
+
+		// read() returns -1 on error, so the result must be kept signed.
+		// Reserve one byte so the data can always be NUL-terminated.
+		ssize_t bytes_read = read(fd, buf, sizeof(buf) - 1);
+		(void)close(fd);
+		i++;
+
+		if (bytes_read <= 0) {
+			_dispatch_debug("workq: Failed to read %s", path);
+			continue;
+		}
+		buf[bytes_read] = '\0';
+
+		char state;
+		const char *comm_end = strrchr(buf, ')');
+		if (comm_end != NULL && sscanf(comm_end + 1, " %c", &state) == 1) {
+			if (state == 'R') {
+				running_count++;
+			}
+		} else {
+			_dispatch_debug("workq: Failed to scan state for worker %d", worker_pid);
+		}
+	}
+
+	mgr->runnable_workers = running_count;
+
+	_dispatch_unfair_lock_unlock(&mgr->registered_worker_lock);
+}
+
+/*
+ * Timer handler: if the default root queue has pending work and fewer
+ * registered workers are runnable than the target, request one more worker
+ * thread for the queue, subject to the limits computed below.
+ */
+static void
+_dispatch_workq_monitor_thread_pool(void *context DISPATCH_UNUSED)
+{
+	dispatch_workq_manager_t mgr = _dispatch_workq_get_default_manager();
+	dispatch_queue_t dq = _dispatch_workq_get_default_root_queue();
+
+	if (!_dispatch_workq_root_queue_has_work(dq)) {
+		_dispatch_debug("workq: %s is empty; doing nothing", dq->dq_label);
+		return;
+	}
+
+	_dispatch_workq_count_runnable_workers(mgr);
+	int32_t pool_count = _dispatch_pthread_root_queue_thread_pool_size(dq);
+
+	_dispatch_debug("workq: %s is non-empty with pool count %d (%d runnable)",
+			dq->dq_label, pool_count,  mgr->runnable_workers);
+
+	int32_t runnable = mgr->runnable_workers;
+	int32_t target = mgr->target_runnable_workers;
+	if (runnable >= target) {
+		// At or above target: nothing to do.
+		return;
+	}
+
+	// Below target. Two situations are distinguished:
+	//   (a) Some workers are still runnable. Oversubscribe to reach the
+	//       target, but since the shortfall may be transitory, only up
+	//       to a small multiple of the target.
+	//   (b) No worker is runnable. The program is likely stalled, so
+	//       behave as if dq were an overcommit queue and keep adding
+	//       workers until the hard limit on workers for dq is reached.
+	int32_t oversubscribe_limit = WORKQ_OVERSUBSCRIBE_FACTOR * target;
+	int32_t stalled_limit = WORKQ_MAX_TRACKED_WORKERS - target;
+	int32_t limit;
+	if (runnable == 0) {
+		limit = stalled_limit;
+	} else {
+		limit = MIN(stalled_limit, oversubscribe_limit);
+	}
+
+	// NOTE(review): pool_count appears to go negative once the pool is
+	// oversubscribed (see the debug message below) -- confirm.
+	if (pool_count + limit <= 0) {
+		_dispatch_debug("workq: %s already oversubscribed by %d; taking no action",
+				dq->dq_label, -pool_count);
+		return;
+	}
+
+	_dispatch_debug("workq: adding 1 additional worker to %s", dq->dq_label);
+	_dispatch_pthread_root_queue_oversubscribe(dq, 1);
+}
+
+/*
+ * One-time setup of the management subsystem, run through dispatch_once_f.
+ * If kext support is compiled in and its initialization succeeds, nothing
+ * else is set up. Otherwise the worker table is allocated, the runnable
+ * target is taken from the active CPU count, and a repeating timer with a
+ * NSEC_PER_SEC interval is installed on _dispatch_mgr_q to run the monitor.
+ */
+static void
+_dispatch_workq_init_once(void *context DISPATCH_UNUSED)
+{
+#if DISPATCH_ENABLE_PWQ_KEXT
+	// Initialize kext subsystem.
+	_dispatch_workq_kext_active = _dispatch_workq_management_init_kext();
+
+	if (_dispatch_workq_kext_active) {
+		return;
+	}
+#endif
+	dispatch_workq_manager_t manager = _dispatch_workq_get_default_manager();
+	manager->registered_workers = _dispatch_calloc(WORKQ_MAX_TRACKED_WORKERS, sizeof(pid_t));
+	manager->target_runnable_workers = dispatch_hw_config(active_cpus);
+
+	// Periodic monitoring timer, serviced on dispatch_mgr_q.
+	dispatch_source_t monitor_timer = dispatch_source_create(
+			DISPATCH_SOURCE_TYPE_TIMER, 0, 0, &_dispatch_mgr_q);
+	dispatch_time_t first_fire = dispatch_time(DISPATCH_TIME_NOW, 0);
+	dispatch_source_set_timer(monitor_timer, first_fire, NSEC_PER_SEC, 0);
+	dispatch_source_set_event_handler_f(monitor_timer, _dispatch_workq_monitor_thread_pool);
+	dispatch_activate(monitor_timer);
+}
+
+#endif // HAVE_INTERNAL_PTHREAD_WORKQUEUE