source: mainline/kernel/generic/src/synch/futex.c@ 38dc82d

lfn serial ticket/834-toolchain-update topic/msim-upgrade topic/simplify-dev-export
Last change on this file since 38dc82d was 38dc82d, checked in by Jakub Jermar <jakub@…>, 9 years ago

Make page_mapping_find() return a copy rather than the actual PTE

This makes page_mapping_find() more suitable for use with lock-free data
structures such as CHT that guarantee existence of the data only for
some limited time while a condition holds (e.g. inside of a RCU-protected
critical section that must be around all CHT lookups).

  • Property mode set to 100644
File size: 14.1 KB
Line 
1/*
2 * Copyright (c) 2006 Jakub Jermar
3 * Copyright (c) 2012 Adam Hraska
4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 *
10 * - Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * - Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * - The name of the author may not be used to endorse or promote products
16 * derived from this software without specific prior written permission.
17 *
18 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
19 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
20 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
21 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
22 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
23 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
27 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 */
29
30/** @addtogroup sync
31 * @{
32 */
33
34/**
35 * @file
36 * @brief Kernel backend for futexes.
37 *
38 * Kernel futex objects are stored in a global hash table futex_ht
39 * where the physical address of the futex variable (futex_t.paddr)
40 * is used as the lookup key. As a result multiple address spaces
41 * may share the same futex variable.
42 *
43 * A kernel futex object is created the first time a task accesses
44 * the futex (having a futex variable at a physical address not
45 * encountered before). Futex object's lifetime is governed by
46 * a reference count that represents the number of all the different
47 * user space virtual addresses from all tasks that map to the
48 * physical address of the futex variable. A futex object is freed
49 * when the last task having accessed the futex exits.
50 *
51 * Each task keeps track of the futex objects it accessed in a list
52 * of pointers (futex_ptr_t, task->futexes->list) to the different
53 * futex objects.
54 *
55 * To speed up translation of futex variables' virtual addresses
56 * to their physical addresses, futex pointers accessed by the
57 * task are furthermore stored in a concurrent hash table (CHT,
58 * task->futexes->ht). A single lookup without locks or accesses
59 * to the page table translates a futex variable's virtual address
60 * into its futex kernel object.
61 */
62
63#include <synch/futex.h>
64#include <synch/mutex.h>
65#include <synch/spinlock.h>
66#include <synch/rcu.h>
67#include <mm/frame.h>
68#include <mm/page.h>
69#include <mm/slab.h>
70#include <proc/thread.h>
71#include <proc/task.h>
72#include <genarch/mm/page_pt.h>
73#include <genarch/mm/page_ht.h>
74#include <adt/cht.h>
75#include <adt/hash_table.h>
76#include <adt/list.h>
77#include <arch.h>
78#include <align.h>
79#include <panic.h>
80#include <errno.h>
81
82#define FUTEX_HT_SIZE 1024 /* keep it a power of 2 */
83
84/** Task specific pointer to a global kernel futex object. */
85typedef struct futex_ptr {
86 /** CHT link. */
87 cht_link_t cht_link;
88 /** List of all futex pointers used by the task. */
89 link_t all_link;
90 /** Kernel futex object. */
91 futex_t *futex;
92 /** User space virtual address of the futex variable in the task. */
93 uintptr_t uaddr;
94} futex_ptr_t;
95
96
97static void destroy_task_cache(work_t *work);
98
99static void futex_initialize(futex_t *futex, uintptr_t paddr);
100static void futex_add_ref(futex_t *futex);
101static void futex_release_ref(futex_t *futex);
102static void futex_release_ref_locked(futex_t *futex);
103
104static futex_t *get_futex(uintptr_t uaddr);
105static futex_t *find_cached_futex(uintptr_t uaddr);
106static futex_t *get_and_cache_futex(uintptr_t phys_addr, uintptr_t uaddr);
107static bool find_futex_paddr(uintptr_t uaddr, uintptr_t *phys_addr);
108
109static size_t futex_ht_hash(sysarg_t *key);
110static bool futex_ht_compare(sysarg_t *key, size_t keys, link_t *item);
111static void futex_ht_remove_callback(link_t *item);
112
113static size_t task_fut_ht_hash(const cht_link_t *link);
114static size_t task_fut_ht_key_hash(void *key);
115static bool task_fut_ht_equal(const cht_link_t *item1, const cht_link_t *item2);
116static bool task_fut_ht_key_equal(void *key, const cht_link_t *item);
117
118
119/** Mutex protecting the global futex hash table.
120 *
121 * Acquire task specific TASK->futex_list_lock before this mutex.
122 */
123SPINLOCK_STATIC_INITIALIZE_NAME(futex_ht_lock, "futex-ht-lock");
124
125/** Global kernel futex hash table. Lock futex_ht_lock before accessing.
126 *
127 * Physical address of the futex variable is the lookup key.
128 */
129static hash_table_t futex_ht;
130
131/** Global kernel futex hash table operations. */
132static hash_table_operations_t futex_ht_ops = {
133 .hash = futex_ht_hash,
134 .compare = futex_ht_compare,
135 .remove_callback = futex_ht_remove_callback
136};
137
138/** Task futex cache CHT operations. */
139static cht_ops_t task_futex_ht_ops = {
140 .hash = task_fut_ht_hash,
141 .key_hash = task_fut_ht_key_hash,
142 .equal = task_fut_ht_equal,
143 .key_equal = task_fut_ht_key_equal,
144 .remove_callback = NULL
145};
146
147/** Initialize futex subsystem. */
148void futex_init(void)
149{
150 hash_table_create(&futex_ht, FUTEX_HT_SIZE, 1, &futex_ht_ops);
151}
152
153/** Initializes the futex structures for the new task. */
154void futex_task_init(struct task *task)
155{
156 task->futexes = malloc(sizeof(struct futex_cache), 0);
157
158 cht_create(&task->futexes->ht, 0, 0, 0, true, &task_futex_ht_ops);
159
160 list_initialize(&task->futexes->list);
161 spinlock_initialize(&task->futexes->list_lock, "futex-list-lock");
162}
163
164/** Destroys the futex structures for the dying task. */
165void futex_task_deinit(task_t *task)
166{
167 /* Interrupts are disabled so we must not block (cannot run cht_destroy). */
168 if (interrupts_disabled()) {
169 /* Invoke the blocking cht_destroy in the background. */
170 workq_global_enqueue_noblock(&task->futexes->destroy_work,
171 destroy_task_cache);
172 } else {
173 /* We can block. Invoke cht_destroy in this thread. */
174 destroy_task_cache(&task->futexes->destroy_work);
175 }
176}
177
178/** Deallocates a task's CHT futex cache (must already be empty). */
179static void destroy_task_cache(work_t *work)
180{
181 struct futex_cache *cache =
182 member_to_inst(work, struct futex_cache, destroy_work);
183
184 /*
185 * Destroy the cache before manually freeing items of the cache in case
186 * table resize is in progress.
187 */
188 cht_destroy_unsafe(&cache->ht);
189
190 /* Manually free futex_ptr cache items. */
191 list_foreach_safe(cache->list, cur_link, next_link) {
192 futex_ptr_t *fut_ptr = member_to_inst(cur_link, futex_ptr_t, all_link);
193
194 list_remove(cur_link);
195 free(fut_ptr);
196 }
197
198 free(cache);
199}
200
201/** Remove references from futexes known to the current task. */
202void futex_task_cleanup(void)
203{
204 struct futex_cache *futexes = TASK->futexes;
205
206 /* All threads of this task have terminated. This is the last thread. */
207 spinlock_lock(&futexes->list_lock);
208
209 list_foreach_safe(futexes->list, cur_link, next_link) {
210 futex_ptr_t *fut_ptr = member_to_inst(cur_link, futex_ptr_t, all_link);
211
212 /*
213 * The function is free to free the futex. All other threads of this
214 * task have already terminated, so they have also definitely
215 * exited their CHT futex cache protecting rcu reader sections.
216 * Moreover release_ref() only frees the futex if this is the
217 * last task referencing the futex. Therefore, only threads
218 * of this task may have referenced the futex if it is to be freed.
219 */
220 futex_release_ref_locked(fut_ptr->futex);
221 }
222
223 spinlock_unlock(&futexes->list_lock);
224}
225
226
227/** Initialize the kernel futex structure.
228 *
229 * @param futex Kernel futex structure.
230 * @param paddr Physical address of the futex variable.
231 */
232static void futex_initialize(futex_t *futex, uintptr_t paddr)
233{
234 waitq_initialize(&futex->wq);
235 link_initialize(&futex->ht_link);
236 futex->paddr = paddr;
237 futex->refcount = 1;
238}
239
240/** Increments the counter of tasks referencing the futex. */
241static void futex_add_ref(futex_t *futex)
242{
243 ASSERT(spinlock_locked(&futex_ht_lock));
244 ASSERT(0 < futex->refcount);
245 ++futex->refcount;
246}
247
248/** Decrements the counter of tasks referencing the futex. May free the futex.*/
249static void futex_release_ref(futex_t *futex)
250{
251 ASSERT(spinlock_locked(&futex_ht_lock));
252 ASSERT(0 < futex->refcount);
253
254 --futex->refcount;
255
256 if (0 == futex->refcount) {
257 hash_table_remove(&futex_ht, &futex->paddr, 1);
258 }
259}
260
261/** Decrements the counter of tasks referencing the futex. May free the futex.*/
262static void futex_release_ref_locked(futex_t *futex)
263{
264 spinlock_lock(&futex_ht_lock);
265 futex_release_ref(futex);
266 spinlock_unlock(&futex_ht_lock);
267}
268
269/** Returns a futex for the virtual address @a uaddr (or creates one). */
270static futex_t *get_futex(uintptr_t uaddr)
271{
272 futex_t *futex = find_cached_futex(uaddr);
273
274 if (futex)
275 return futex;
276
277 uintptr_t paddr;
278
279 if (!find_futex_paddr(uaddr, &paddr)) {
280 return 0;
281 }
282
283 return get_and_cache_futex(paddr, uaddr);
284}
285
286
287/** Finds the physical address of the futex variable. */
288static bool find_futex_paddr(uintptr_t uaddr, uintptr_t *paddr)
289{
290 page_table_lock(AS, false);
291 spinlock_lock(&futex_ht_lock);
292
293 bool success = false;
294
295 pte_t t;
296 bool found;
297
298 found = page_mapping_find(AS, ALIGN_DOWN(uaddr, PAGE_SIZE), true, &t);
299 if (found && PTE_VALID(&t) && PTE_PRESENT(&t)) {
300 success = true;
301 *paddr = PTE_GET_FRAME(&t) +
302 (uaddr - ALIGN_DOWN(uaddr, PAGE_SIZE));
303 }
304
305 spinlock_unlock(&futex_ht_lock);
306 page_table_unlock(AS, false);
307
308 return success;
309}
310
311/** Returns the futex cached in this task with the virtual address uaddr. */
312static futex_t *find_cached_futex(uintptr_t uaddr)
313{
314 cht_read_lock();
315
316 futex_t *futex;
317 cht_link_t *futex_ptr_link = cht_find_lazy(&TASK->futexes->ht, &uaddr);
318
319 if (futex_ptr_link) {
320 futex_ptr_t *futex_ptr
321 = member_to_inst(futex_ptr_link, futex_ptr_t, cht_link);
322
323 futex = futex_ptr->futex;
324 } else {
325 futex = NULL;
326 }
327
328 cht_read_unlock();
329
330 return futex;
331}
332
333
334/**
335 * Returns a kernel futex for the physical address @a phys_addr and caches
336 * it in this task under the virtual address @a uaddr (if not already cached).
337 */
338static futex_t *get_and_cache_futex(uintptr_t phys_addr, uintptr_t uaddr)
339{
340 futex_t *futex = malloc(sizeof(futex_t), 0);
341
342 /*
343 * Find the futex object in the global futex table (or insert it
344 * if it is not present).
345 */
346 spinlock_lock(&futex_ht_lock);
347
348 link_t *fut_link = hash_table_find(&futex_ht, &phys_addr);
349
350 if (fut_link) {
351 free(futex);
352 futex = member_to_inst(fut_link, futex_t, ht_link);
353 futex_add_ref(futex);
354 } else {
355 futex_initialize(futex, phys_addr);
356 hash_table_insert(&futex_ht, &phys_addr, &futex->ht_link);
357 }
358
359 spinlock_unlock(&futex_ht_lock);
360
361 /*
362 * Cache the link to the futex object for this task.
363 */
364 futex_ptr_t *fut_ptr = malloc(sizeof(futex_ptr_t), 0);
365 cht_link_t *dup_link;
366
367 fut_ptr->futex = futex;
368 fut_ptr->uaddr = uaddr;
369
370 cht_read_lock();
371
372 /* Cache the mapping from the virtual address to the futex for this task. */
373 if (cht_insert_unique(&TASK->futexes->ht, &fut_ptr->cht_link, &dup_link)) {
374 spinlock_lock(&TASK->futexes->list_lock);
375 list_append(&fut_ptr->all_link, &TASK->futexes->list);
376 spinlock_unlock(&TASK->futexes->list_lock);
377 } else {
378 /* Another thread of this task beat us to it. Use that mapping instead.*/
379 free(fut_ptr);
380 futex_release_ref_locked(futex);
381
382 futex_ptr_t *dup = member_to_inst(dup_link, futex_ptr_t, cht_link);
383 futex = dup->futex;
384 }
385
386 cht_read_unlock();
387
388 return futex;
389}
390
391/** Sleep in futex wait queue.
392 *
393 * @param uaddr Userspace address of the futex counter.
394 *
395 * @return If there is no physical mapping for uaddr ENOENT is
396 * returned. Otherwise returns a wait result as defined in
397 * synch.h.
398 */
399sysarg_t sys_futex_sleep(uintptr_t uaddr)
400{
401 futex_t *futex = get_futex(uaddr);
402
403 if (!futex)
404 return (sysarg_t) ENOENT;
405
406#ifdef CONFIG_UDEBUG
407 udebug_stoppable_begin();
408#endif
409
410 int rc = waitq_sleep_timeout(&futex->wq, 0, SYNCH_FLAGS_INTERRUPTIBLE);
411
412#ifdef CONFIG_UDEBUG
413 udebug_stoppable_end();
414#endif
415
416 return (sysarg_t) rc;
417}
418
419/** Wakeup one thread waiting in futex wait queue.
420 *
421 * @param uaddr Userspace address of the futex counter.
422 *
423 * @return ENOENT if there is no physical mapping for uaddr.
424 */
425sysarg_t sys_futex_wakeup(uintptr_t uaddr)
426{
427 futex_t *futex = get_futex(uaddr);
428
429 if (futex) {
430 waitq_wakeup(&futex->wq, WAKEUP_FIRST);
431 return 0;
432 } else {
433 return (sysarg_t) ENOENT;
434 }
435}
436
437
438/** Compute hash index into futex hash table.
439 *
440 * @param key Address where the key (i.e. physical address of futex
441 * counter) is stored.
442 *
443 * @return Index into futex hash table.
444 */
445size_t futex_ht_hash(sysarg_t *key)
446{
447 return (*key & (FUTEX_HT_SIZE - 1));
448}
449
450/** Compare futex hash table item with a key.
451 *
452 * @param key Address where the key (i.e. physical address of futex
453 * counter) is stored.
454 *
455 * @return True if the item matches the key. False otherwise.
456 */
457bool futex_ht_compare(sysarg_t *key, size_t keys, link_t *item)
458{
459 futex_t *futex;
460
461 ASSERT(keys == 1);
462
463 futex = hash_table_get_instance(item, futex_t, ht_link);
464 return *key == futex->paddr;
465}
466
467/** Callback for removal items from futex hash table.
468 *
469 * @param item Item removed from the hash table.
470 */
471void futex_ht_remove_callback(link_t *item)
472{
473 futex_t *futex;
474
475 futex = hash_table_get_instance(item, futex_t, ht_link);
476 free(futex);
477}
478
479/*
480 * Operations of a task's CHT that caches mappings of futex user space
481 * virtual addresses to kernel futex objects.
482 */
483
484static size_t task_fut_ht_hash(const cht_link_t *link)
485{
486 const futex_ptr_t *fut_ptr = member_to_inst(link, futex_ptr_t, cht_link);
487 return fut_ptr->uaddr;
488}
489
/** Hash of a lookup key; @a key points to a uintptr_t user space address. */
static size_t task_fut_ht_key_hash(void *key)
{
	uintptr_t *uaddr = key;

	return *uaddr;
}
494
495static bool task_fut_ht_equal(const cht_link_t *item1, const cht_link_t *item2)
496{
497 const futex_ptr_t *fut_ptr1 = member_to_inst(item1, futex_ptr_t, cht_link);
498 const futex_ptr_t *fut_ptr2 = member_to_inst(item2, futex_ptr_t, cht_link);
499
500 return fut_ptr1->uaddr == fut_ptr2->uaddr;
501}
502
503static bool task_fut_ht_key_equal(void *key, const cht_link_t *item)
504{
505 const futex_ptr_t *fut_ptr = member_to_inst(item, futex_ptr_t, cht_link);
506 uintptr_t uaddr = *(uintptr_t*)key;
507
508 return fut_ptr->uaddr == uaddr;
509}
510
511/** @}
512 */
Note: See TracBrowser for help on using the repository browser.