| #ifndef _LINUX_CLOSURE_H | 
 | #define _LINUX_CLOSURE_H | 
 |  | 
 | #include <linux/llist.h> | 
 | #include <linux/sched.h> | 
 | #include <linux/workqueue.h> | 
 |  | 
 | /* | 
 |  * Closure is perhaps the most overused and abused term in computer science, but | 
 |  * since I've been unable to come up with anything better you're stuck with it | 
 |  * again. | 
 |  * | 
 |  * What are closures? | 
 |  * | 
 |  * They embed a refcount. The basic idea is they count "things that are in | 
 |  * progress" - in flight bios, some other thread that's doing something else - | 
 |  * anything you might want to wait on. | 
 |  * | 
 |  * The refcount may be manipulated with closure_get() and closure_put(). | 
 |  * closure_put() is where many of the interesting things happen, when it causes | 
 |  * the refcount to go to 0. | 
 |  * | 
 |  * Closures can be used to wait on things both synchronously and asynchronously, | 
 |  * and synchronous and asynchronous use can be mixed without restriction. To | 
 |  * wait synchronously, use closure_sync() - you will sleep until your closure's | 
 |  * refcount hits 1. | 
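|  * |
|  * For example, a sketch of waiting synchronously on a stack allocated closure |
|  * (bio_submit() and foo_endio() are the illustrative names also used in the |
|  * asynchronous example below; foo_endio() just does a closure_put()): |
|  * |
|  * struct closure cl; |
|  * |
|  * closure_init_stack(&cl); |
|  * closure_get(&cl); |
|  * bio1->bi_endio = foo_endio; |
|  * bio_submit(bio1); |
|  * closure_sync(&cl); |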
 |  * | 
 |  * To wait asynchronously, use | 
 |  *   continue_at(cl, next_function, workqueue); | 
 |  * | 
 |  * passing it, as you might expect, the function to run when nothing is pending | 
 |  * and the workqueue to run that function out of. | 
 |  * | 
|  * continue_at() also, critically, is a macro that returns from the calling |
|  * function. There's good reason for this. |
 |  * | 
|  * To use closures asynchronously safely, a closure must always have a refcount |
|  * while it is running, owned by the thread that is running it. Otherwise, |
|  * suppose you submit some bios and wish to have a function run when they all |
|  * complete: |
 |  * | 
 |  * foo_endio(struct bio *bio, int error) | 
 |  * { | 
 |  *	closure_put(cl); | 
 |  * } | 
 |  * | 
|  * closure_init(cl, NULL); |
 |  * | 
 |  * do_stuff(); | 
 |  * closure_get(cl); | 
 |  * bio1->bi_endio = foo_endio; | 
 |  * bio_submit(bio1); | 
 |  * | 
 |  * do_more_stuff(); | 
 |  * closure_get(cl); | 
 |  * bio2->bi_endio = foo_endio; | 
 |  * bio_submit(bio2); | 
 |  * | 
 |  * continue_at(cl, complete_some_read, system_wq); | 
 |  * | 
|  * If the closure's refcount started at 0, complete_some_read() could run |
|  * before the second bio was submitted - which is almost always not what you |
|  * want! More importantly, it wouldn't be possible to say whether the original |
|  * thread or complete_some_read()'s thread owned the closure - and whatever |
|  * state it was associated with! |
 |  * | 
 |  * So, closure_init() initializes a closure's refcount to 1 - and when a | 
 |  * closure_fn is run, the refcount will be reset to 1 first. | 
 |  * | 
 |  * Then, the rule is - if you got the refcount with closure_get(), release it | 
|  * with closure_put() (e.g. in a bio->bi_endio function). If you have a refcount |
 |  * on a closure because you called closure_init() or you were run out of a | 
 |  * closure - _always_ use continue_at(). Doing so consistently will help | 
 |  * eliminate an entire class of particularly pernicious races. | 
 |  * | 
 |  * For a closure to wait on an arbitrary event, we need to introduce waitlists: | 
 |  * | 
 |  * struct closure_waitlist list; | 
|  * closure_wait_event(&list, cl, condition); |
|  * closure_wake_up(&list); |
 |  * | 
|  * These work analogously to wait_event() and wake_up() - except that instead of |
 |  * operating on the current thread (for wait_event()) and lists of threads, they | 
 |  * operate on an explicit closure and lists of closures. | 
 |  * | 
 |  * Because it's a closure we can now wait either synchronously or | 
 |  * asynchronously. closure_wait_event() returns the current value of the | 
 |  * condition, and if it returned false continue_at() or closure_sync() can be | 
 |  * used to wait for it to become true. | 
 |  * | 
 |  * It's useful for waiting on things when you can't sleep in the context in | 
|  * which you must check the condition (perhaps with a spinlock held, or you |
|  * might be beneath generic_make_request() - in which case you can't sleep |
|  * on IO). |
 |  * | 
 |  * closure_wait_event() will wait either synchronously or asynchronously, | 
 |  * depending on whether the closure is in blocking mode or not. You can pick a | 
 |  * mode explicitly with closure_wait_event_sync() and | 
 |  * closure_wait_event_async(), which do just what you might expect. | 
 |  * | 
 |  * Lastly, you might have a wait list dedicated to a specific event, and have no | 
 |  * need for specifying the condition - you just want to wait until someone runs | 
 |  * closure_wake_up() on the appropriate wait list. In that case, just use | 
|  * closure_wait(). It returns true if the closure was added to the wait list, |
|  * and false if it was already on one - a closure can only be on one wait list |
|  * at a time. |
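|  * |
|  * For example, a sketch of waiting asynchronously for the next |
|  * closure_wake_up() on a dedicated wait list (foo_wait, foo_resume() and |
|  * foo_wq are illustrative names, not part of this API): |
|  * |
|  * closure_wait(&foo_wait, cl); |
|  * continue_at(cl, foo_resume, foo_wq); |
|  * |
|  * foo_resume() will then run out of foo_wq once someone calls |
|  * closure_wake_up(&foo_wait) and any other refs on cl have been dropped. |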
 |  * | 
 |  * Parents: | 
 |  * | 
|  * closure_init() takes two arguments - the closure to initialize, and a |
|  * (possibly null) parent. |
 |  * | 
|  * If parent is non null, the new closure will hold a refcount on the parent |
|  * for its own lifetime; a closure is considered to be "finished" when its |
|  * refcount hits 0 and the function to run is null. Hence |
 |  * | 
 |  * continue_at(cl, NULL, NULL); | 
 |  * | 
 |  * returns up the (spaghetti) stack of closures, precisely like normal return | 
 |  * returns up the C stack. continue_at() with non null fn is better thought of | 
 |  * as doing a tail call. | 
 |  * | 
 |  * All this implies that a closure should typically be embedded in a particular | 
 |  * struct (which its refcount will normally control the lifetime of), and that | 
 |  * struct can very much be thought of as a stack frame. | 
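|  * |
|  * For example, a sketch of a parent/child relationship (struct read_op, |
|  * read_done() and the workqueue are illustrative names): |
|  * |
|  * static void read_done(struct closure *cl) |
|  * { |
|  *	struct read_op *op = container_of(cl, struct read_op, cl); |
|  * |
|  *	... |
|  *	closure_return(cl); |
|  * } |
|  * |
|  * closure_init(&op->cl, parent); |
|  * ... submit bios, taking refs with closure_get() as above ... |
|  * continue_at(&op->cl, read_done, system_wq); |
|  * |
|  * Once read_done() finishes the child closure, the refcount it took on parent |
|  * at closure_init() time is dropped - possibly finishing the parent in turn. |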
 |  * | 
 |  * Locking: | 
 |  * | 
 |  * Closures are based on work items but they can be thought of as more like | 
|  * threads - in that, like threads and unlike work items, they have a well |
 |  * defined lifetime; they are created (with closure_init()) and eventually | 
 |  * complete after a continue_at(cl, NULL, NULL). | 
 |  * | 
 |  * Suppose you've got some larger structure with a closure embedded in it that's | 
 |  * used for periodically doing garbage collection. You only want one garbage | 
 |  * collection happening at a time, so the natural thing to do is protect it with | 
 |  * a lock. However, it's difficult to use a lock protecting a closure correctly | 
|  * because the unlock should come after the last continue_at() (additionally, if |
 |  * you're using the closure asynchronously a mutex won't work since a mutex has | 
 |  * to be unlocked by the same process that locked it). | 
 |  * | 
 |  * So to make it less error prone and more efficient, we also have the ability | 
 |  * to use closures as locks: | 
 |  * | 
 |  * closure_init_unlocked(); | 
 |  * closure_trylock(); | 
 |  * | 
 |  * That's all we need for trylock() - the last closure_put() implicitly unlocks | 
 |  * it for you.  But for closure_lock(), we also need a wait list: | 
 |  * | 
 |  * struct closure_with_waitlist frobnicator_cl; | 
 |  * | 
 |  * closure_init_unlocked(&frobnicator_cl); | 
 |  * closure_lock(&frobnicator_cl); | 
 |  * | 
 |  * A closure_with_waitlist embeds a closure and a wait list - much like struct | 
 |  * delayed_work embeds a work item and a timer_list. The important thing is, use | 
 |  * it exactly like you would a regular closure and closure_put() will magically | 
 |  * handle everything for you. | 
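|  * |
|  * A fuller sketch of the frobnicator example above (frobnicate() and the |
|  * workqueue are illustrative names): |
|  * |
|  * static void frobnicate(struct closure *cl) |
|  * { |
|  *	... |
|  *	closure_return(cl); |
|  * } |
|  * |
|  * Then, to start a frobnication only if one isn't already in progress: |
|  * |
|  * closure_trylock_call(&frobnicator_cl.cl, frobnicate, system_wq, NULL); |
|  * |
|  * The final closure_put() - here the one done by closure_return() - drops the |
|  * refcount to 0, which unlocks the closure again and wakes up anything |
|  * sleeping in closure_lock(). |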
 |  */ | 
 |  | 
 | struct closure; | 
 | typedef void (closure_fn) (struct closure *); | 
 |  | 
 | struct closure_waitlist { | 
 | 	struct llist_head	list; | 
 | }; | 
 |  | 
 | enum closure_type { | 
 | 	TYPE_closure				= 0, | 
 | 	TYPE_closure_with_waitlist		= 1, | 
 | 	MAX_CLOSURE_TYPE			= 1, | 
 | }; | 
 |  | 
 | enum closure_state { | 
 | 	/* | 
 | 	 * CLOSURE_WAITING: Set iff the closure is on a waitlist. Must be set by | 
 | 	 * the thread that owns the closure, and cleared by the thread that's | 
 | 	 * waking up the closure. | 
 | 	 * | 
 | 	 * CLOSURE_SLEEPING: Must be set before a thread uses a closure to sleep | 
 | 	 * - indicates that cl->task is valid and closure_put() may wake it up. | 
 | 	 * Only set or cleared by the thread that owns the closure. | 
 | 	 * | 
 | 	 * The rest are for debugging and don't affect behaviour: | 
 | 	 * | 
 | 	 * CLOSURE_RUNNING: Set when a closure is running (i.e. by | 
| 	 * closure_init() and when closure_put() runs the next function), and |
 | 	 * must be cleared before remaining hits 0. Primarily to help guard | 
 | 	 * against incorrect usage and accidentally transferring references. | 
 | 	 * continue_at() and closure_return() clear it for you, if you're doing | 
 | 	 * something unusual you can use closure_set_dead() which also helps | 
 | 	 * annotate where references are being transferred. | 
 | 	 * | 
 | 	 * CLOSURE_STACK: Sanity check - remaining should never hit 0 on a | 
 | 	 * closure with this flag set | 
 | 	 */ | 
 |  | 
 | 	CLOSURE_BITS_START	= (1 << 23), | 
 | 	CLOSURE_DESTRUCTOR	= (1 << 23), | 
 | 	CLOSURE_WAITING		= (1 << 25), | 
 | 	CLOSURE_SLEEPING	= (1 << 27), | 
 | 	CLOSURE_RUNNING		= (1 << 29), | 
 | 	CLOSURE_STACK		= (1 << 31), | 
 | }; | 
 |  | 
 | #define CLOSURE_GUARD_MASK					\ | 
 | 	((CLOSURE_DESTRUCTOR|CLOSURE_WAITING|CLOSURE_SLEEPING|	\ | 
 | 	  CLOSURE_RUNNING|CLOSURE_STACK) << 1) | 
 |  | 
 | #define CLOSURE_REMAINING_MASK		(CLOSURE_BITS_START - 1) | 
 | #define CLOSURE_REMAINING_INITIALIZER	(1|CLOSURE_RUNNING) | 
 |  | 
 | struct closure { | 
 | 	union { | 
 | 		struct { | 
 | 			struct workqueue_struct *wq; | 
 | 			struct task_struct	*task; | 
 | 			struct llist_node	list; | 
 | 			closure_fn		*fn; | 
 | 		}; | 
 | 		struct work_struct	work; | 
 | 	}; | 
 |  | 
 | 	struct closure		*parent; | 
 |  | 
 | 	atomic_t		remaining; | 
 |  | 
 | 	enum closure_type	type; | 
 |  | 
 | #ifdef CONFIG_BCACHE_CLOSURES_DEBUG | 
 | #define CLOSURE_MAGIC_DEAD	0xc054dead | 
 | #define CLOSURE_MAGIC_ALIVE	0xc054a11e | 
 |  | 
 | 	unsigned		magic; | 
 | 	struct list_head	all; | 
 | 	unsigned long		ip; | 
 | 	unsigned long		waiting_on; | 
 | #endif | 
 | }; | 
 |  | 
 | struct closure_with_waitlist { | 
 | 	struct closure		cl; | 
 | 	struct closure_waitlist	wait; | 
 | }; | 
 |  | 
 | extern unsigned invalid_closure_type(void); | 
 |  | 
 | #define __CLOSURE_TYPE(cl, _t)						\ | 
 | 	  __builtin_types_compatible_p(typeof(cl), struct _t)		\ | 
 | 		? TYPE_ ## _t :						\ | 
 |  | 
 | #define __closure_type(cl)						\ | 
 | (									\ | 
 | 	__CLOSURE_TYPE(cl, closure)					\ | 
 | 	__CLOSURE_TYPE(cl, closure_with_waitlist)			\ | 
 | 	invalid_closure_type()						\ | 
 | ) | 
 |  | 
 | void closure_sub(struct closure *cl, int v); | 
 | void closure_put(struct closure *cl); | 
 | void __closure_wake_up(struct closure_waitlist *list); | 
 | bool closure_wait(struct closure_waitlist *list, struct closure *cl); | 
 | void closure_sync(struct closure *cl); | 
 |  | 
 | bool closure_trylock(struct closure *cl, struct closure *parent); | 
 | void __closure_lock(struct closure *cl, struct closure *parent, | 
 | 		    struct closure_waitlist *wait_list); | 
 |  | 
 | #ifdef CONFIG_BCACHE_CLOSURES_DEBUG | 
 |  | 
 | void closure_debug_init(void); | 
 | void closure_debug_create(struct closure *cl); | 
 | void closure_debug_destroy(struct closure *cl); | 
 |  | 
 | #else | 
 |  | 
 | static inline void closure_debug_init(void) {} | 
 | static inline void closure_debug_create(struct closure *cl) {} | 
 | static inline void closure_debug_destroy(struct closure *cl) {} | 
 |  | 
 | #endif | 
 |  | 
 | static inline void closure_set_ip(struct closure *cl) | 
 | { | 
 | #ifdef CONFIG_BCACHE_CLOSURES_DEBUG | 
 | 	cl->ip = _THIS_IP_; | 
 | #endif | 
 | } | 
 |  | 
 | static inline void closure_set_ret_ip(struct closure *cl) | 
 | { | 
 | #ifdef CONFIG_BCACHE_CLOSURES_DEBUG | 
 | 	cl->ip = _RET_IP_; | 
 | #endif | 
 | } | 
 |  | 
 | static inline void closure_get(struct closure *cl) | 
 | { | 
 | #ifdef CONFIG_BCACHE_CLOSURES_DEBUG | 
 | 	BUG_ON((atomic_inc_return(&cl->remaining) & | 
 | 		CLOSURE_REMAINING_MASK) <= 1); | 
 | #else | 
 | 	atomic_inc(&cl->remaining); | 
 | #endif | 
 | } | 
 |  | 
 | static inline void closure_set_stopped(struct closure *cl) | 
 | { | 
 | 	atomic_sub(CLOSURE_RUNNING, &cl->remaining); | 
 | } | 
 |  | 
 | static inline bool closure_is_unlocked(struct closure *cl) | 
 | { | 
 | 	return atomic_read(&cl->remaining) == -1; | 
 | } | 
 |  | 
 | static inline void do_closure_init(struct closure *cl, struct closure *parent, | 
 | 				   bool running) | 
 | { | 
 | 	cl->parent = parent; | 
 | 	if (parent) | 
 | 		closure_get(parent); | 
 |  | 
 | 	if (running) { | 
 | 		closure_debug_create(cl); | 
 | 		atomic_set(&cl->remaining, CLOSURE_REMAINING_INITIALIZER); | 
 | 	} else | 
 | 		atomic_set(&cl->remaining, -1); | 
 |  | 
 | 	closure_set_ip(cl); | 
 | } | 
 |  | 
 | /* | 
 |  * Hack to get at the embedded closure if there is one, by doing an unsafe cast: | 
|  * the result of __closure_type() is thrown away; it's used merely for type |
 |  * checking. | 
 |  */ | 
 | #define __to_internal_closure(cl)				\ | 
 | ({								\ | 
 | 	BUILD_BUG_ON(__closure_type(*cl) > MAX_CLOSURE_TYPE);	\ | 
 | 	(struct closure *) cl;					\ | 
 | }) | 
 |  | 
 | #define closure_init_type(cl, parent, running)			\ | 
 | do {								\ | 
 | 	struct closure *_cl = __to_internal_closure(cl);	\ | 
 | 	_cl->type = __closure_type(*(cl));			\ | 
 | 	do_closure_init(_cl, parent, running);			\ | 
 | } while (0) | 
 |  | 
 | /** | 
 |  * __closure_init() - Initialize a closure, skipping the memset() | 
 |  * | 
 |  * May be used instead of closure_init() when memory has already been zeroed. | 
 |  */ | 
 | #define __closure_init(cl, parent)				\ | 
 | 	closure_init_type(cl, parent, true) | 
 |  | 
 | /** | 
 |  * closure_init() - Initialize a closure, setting the refcount to 1 | 
 |  * @cl:		closure to initialize | 
 |  * @parent:	parent of the new closure. cl will take a refcount on it for its | 
 |  *		lifetime; may be NULL. | 
 |  */ | 
 | #define closure_init(cl, parent)				\ | 
 | do {								\ | 
 | 	memset((cl), 0, sizeof(*(cl)));				\ | 
 | 	__closure_init(cl, parent);				\ | 
 | } while (0) | 
 |  | 
 | static inline void closure_init_stack(struct closure *cl) | 
 | { | 
 | 	memset(cl, 0, sizeof(struct closure)); | 
 | 	atomic_set(&cl->remaining, CLOSURE_REMAINING_INITIALIZER|CLOSURE_STACK); | 
 | } | 
 |  | 
 | /** | 
 |  * closure_init_unlocked() - Initialize a closure but leave it unlocked. | 
 |  * @cl:		closure to initialize | 
 |  * | 
 |  * For when the closure will be used as a lock. The closure may not be used | 
 |  * until after a closure_lock() or closure_trylock(). | 
 |  */ | 
 | #define closure_init_unlocked(cl)				\ | 
 | do {								\ | 
 | 	memset((cl), 0, sizeof(*(cl)));				\ | 
 | 	closure_init_type(cl, NULL, false);			\ | 
 | } while (0) | 
 |  | 
 | /** | 
 |  * closure_lock() - lock and initialize a closure. | 
 |  * @cl:		the closure to lock | 
 |  * @parent:	the new parent for this closure | 
 |  * | 
 |  * The closure must be of one of the types that has a waitlist (otherwise we | 
 |  * wouldn't be able to sleep on contention). | 
 |  * | 
 |  * @parent has exactly the same meaning as in closure_init(); if non null, the | 
 |  * closure will take a reference on @parent which will be released when it is | 
 |  * unlocked. | 
 |  */ | 
 | #define closure_lock(cl, parent)				\ | 
 | 	__closure_lock(__to_internal_closure(cl), parent, &(cl)->wait) | 
 |  | 
 | static inline void __closure_end_sleep(struct closure *cl) | 
 | { | 
 | 	__set_current_state(TASK_RUNNING); | 
 |  | 
 | 	if (atomic_read(&cl->remaining) & CLOSURE_SLEEPING) | 
 | 		atomic_sub(CLOSURE_SLEEPING, &cl->remaining); | 
 | } | 
 |  | 
 | static inline void __closure_start_sleep(struct closure *cl) | 
 | { | 
 | 	closure_set_ip(cl); | 
 | 	cl->task = current; | 
 | 	set_current_state(TASK_UNINTERRUPTIBLE); | 
 |  | 
 | 	if (!(atomic_read(&cl->remaining) & CLOSURE_SLEEPING)) | 
 | 		atomic_add(CLOSURE_SLEEPING, &cl->remaining); | 
 | } | 
 |  | 
 | /** | 
 |  * closure_wake_up() - wake up all closures on a wait list. | 
 |  */ | 
 | static inline void closure_wake_up(struct closure_waitlist *list) | 
 | { | 
 | 	smp_mb(); | 
 | 	__closure_wake_up(list); | 
 | } | 
 |  | 
 | /* | 
 |  * Wait on an event, synchronously or asynchronously - analogous to wait_event() | 
 |  * but for closures. | 
 |  * | 
 |  * The loop is oddly structured so as to avoid a race; we must check the | 
|  * condition again after we've added ourselves to the waitlist. We know if we were |
 |  * already on the waitlist because closure_wait() returns false; thus, we only | 
 |  * schedule or break if closure_wait() returns false. If it returns true, we | 
 |  * just loop again - rechecking the condition. | 
 |  * | 
 |  * The __closure_wake_up() is necessary because we may race with the event | 
 |  * becoming true; i.e. we see event false -> wait -> recheck condition, but the | 
 |  * thread that made the event true may have called closure_wake_up() before we | 
|  * added ourselves to the wait list. |
 |  * | 
 |  * We have to call closure_sync() at the end instead of just | 
 |  * __closure_end_sleep() because a different thread might've called | 
 |  * closure_wake_up() before us and gotten preempted before they dropped the | 
 |  * refcount on our closure. If this was a stack allocated closure, that would be | 
 |  * bad. | 
 |  */ | 
 | #define closure_wait_event(list, cl, condition)				\ | 
 | ({									\ | 
 | 	typeof(condition) ret;						\ | 
 | 									\ | 
 | 	while (1) {							\ | 
 | 		ret = (condition);					\ | 
 | 		if (ret) {						\ | 
 | 			__closure_wake_up(list);			\ | 
 | 			closure_sync(cl);				\ | 
 | 			break;						\ | 
 | 		}							\ | 
 | 									\ | 
 | 		__closure_start_sleep(cl);				\ | 
 | 									\ | 
 | 		if (!closure_wait(list, cl))				\ | 
 | 			schedule();					\ | 
 | 	}								\ | 
 | 									\ | 
 | 	ret;								\ | 
 | }) | 
 |  | 
 | static inline void closure_queue(struct closure *cl) | 
 | { | 
 | 	struct workqueue_struct *wq = cl->wq; | 
 | 	if (wq) { | 
 | 		INIT_WORK(&cl->work, cl->work.func); | 
 | 		BUG_ON(!queue_work(wq, &cl->work)); | 
 | 	} else | 
 | 		cl->fn(cl); | 
 | } | 
 |  | 
 | static inline void set_closure_fn(struct closure *cl, closure_fn *fn, | 
 | 				  struct workqueue_struct *wq) | 
 | { | 
 | 	BUG_ON(object_is_on_stack(cl)); | 
 | 	closure_set_ip(cl); | 
 | 	cl->fn = fn; | 
 | 	cl->wq = wq; | 
| 	/* |
| 	 * Make sure fn and wq are set before the atomic_dec() in |
| 	 * closure_put() drops our ref |
| 	 */ |
 | 	smp_mb__before_atomic_dec(); | 
 | } | 
 |  | 
 | #define continue_at(_cl, _fn, _wq)					\ | 
 | do {									\ | 
 | 	set_closure_fn(_cl, _fn, _wq);					\ | 
 | 	closure_sub(_cl, CLOSURE_RUNNING + 1);				\ | 
 | 	return;								\ | 
 | } while (0) | 
 |  | 
 | #define closure_return(_cl)	continue_at((_cl), NULL, NULL) | 
 |  | 
 | #define continue_at_nobarrier(_cl, _fn, _wq)				\ | 
 | do {									\ | 
 | 	set_closure_fn(_cl, _fn, _wq);					\ | 
 | 	closure_queue(_cl);						\ | 
 | 	return;								\ | 
 | } while (0) | 
 |  | 
 | #define closure_return_with_destructor(_cl, _destructor)		\ | 
 | do {									\ | 
 | 	set_closure_fn(_cl, _destructor, NULL);				\ | 
 | 	closure_sub(_cl, CLOSURE_RUNNING - CLOSURE_DESTRUCTOR + 1);	\ | 
 | 	return;								\ | 
 | } while (0) | 
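|  |
| /* |
|  * For example, a sketch of freeing a dynamically allocated object with |
|  * closure_return_with_destructor() once all references are gone (struct foo, |
|  * foo_free() and foo_finish() are illustrative names; struct foo is assumed |
|  * to embed its closure as "cl"): |
|  * |
|  * static void foo_free(struct closure *cl) |
|  * { |
|  *	kfree(container_of(cl, struct foo, cl)); |
|  * } |
|  * |
|  * static void foo_finish(struct closure *cl) |
|  * { |
|  *	closure_return_with_destructor(cl, foo_free); |
|  * } |
|  * |
|  * foo_free() is called once the refcount hits 0, i.e. after all outstanding |
|  * references have been dropped. |
|  */ |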
 |  | 
 | static inline void closure_call(struct closure *cl, closure_fn fn, | 
 | 				struct workqueue_struct *wq, | 
 | 				struct closure *parent) | 
 | { | 
 | 	closure_init(cl, parent); | 
 | 	continue_at_nobarrier(cl, fn, wq); | 
 | } | 
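|  |
| /* |
|  * For example (a sketch; op, foo_start() and op->wq are illustrative): start |
|  * an asynchronous operation whose state lives in *op, as a child of the |
|  * caller's closure cl: |
|  * |
|  *	closure_call(&op->cl, foo_start, op->wq, cl); |
|  */ |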
 |  | 
 | static inline void closure_trylock_call(struct closure *cl, closure_fn fn, | 
 | 					struct workqueue_struct *wq, | 
 | 					struct closure *parent) | 
 | { | 
 | 	if (closure_trylock(cl, parent)) | 
 | 		continue_at_nobarrier(cl, fn, wq); | 
 | } | 
 |  | 
 | #endif /* _LINUX_CLOSURE_H */ |