source: mainline/kernel/generic/src/synch/futex.c@ 38dc82d

lfn serial ticket/834-toolchain-update topic/msim-upgrade topic/simplify-dev-export
Last change on this file since 38dc82d was 38dc82d, checked in by Jakub Jermar <jakub@…>, 9 years ago

Make page_mapping_find() return a copy rather than the actual PTE

This makes page_mapping_find() more suitable for use with lock-free data
structures such as CHT that guarantee existence of the data only for
some limited time while a condition holds (e.g. inside of a RCU-protected
critical section that must be around all CHT lookups).

  • Property mode set to 100644
File size: 14.1 KB
RevLine 
[9aa72b4]1/*
[df4ed85]2 * Copyright (c) 2006 Jakub Jermar
[669f3d32]3 * Copyright (c) 2012 Adam Hraska
[9aa72b4]4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 *
10 * - Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * - Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * - The name of the author may not be used to endorse or promote products
16 * derived from this software without specific prior written permission.
17 *
18 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
19 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
20 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
21 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
22 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
23 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
27 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 */
29
[cc73a8a1]30/** @addtogroup sync
[b45c443]31 * @{
32 */
33
[9aa72b4]34/**
[b45c443]35 * @file
[cf26ba9]36 * @brief Kernel backend for futexes.
[ba368a6]37 *
38 * Kernel futex objects are stored in a global hash table futex_ht
39 * where the physical address of the futex variable (futex_t.paddr)
40 * is used as the lookup key. As a result multiple address spaces
41 * may share the same futex variable.
42 *
43 * A kernel futex object is created the first time a task accesses
44 * the futex (having a futex variable at a physical address not
45 * encountered before). Futex object's lifetime is governed by
46 * a reference count that represents the number of all the different
47 * user space virtual addresses from all tasks that map to the
48 * physical address of the futex variable. A futex object is freed
49 * when the last task having accessed the futex exits.
50 *
51 * Each task keeps track of the futex objects it accessed in a list
52 * of pointers (futex_ptr_t, task->futex_list) to the different futex
53 * objects.
54 *
55 * To speed up translation of futex variables' virtual addresses
56 * to their physical addresses, futex pointers accessed by the
57 * task are furthermore stored in a concurrent hash table (CHT,
58 * task->futexes->ht). A single lookup without locks or accesses
59 * to the page table translates a futex variable's virtual address
60 * into its futex kernel object.
[9aa72b4]61 */
62
63#include <synch/futex.h>
[ee42e43]64#include <synch/mutex.h>
[303c94c]65#include <synch/spinlock.h>
[669f3d32]66#include <synch/rcu.h>
[9aa72b4]67#include <mm/frame.h>
68#include <mm/page.h>
69#include <mm/slab.h>
[303c94c]70#include <proc/thread.h>
[4fded58]71#include <proc/task.h>
[9aa72b4]72#include <genarch/mm/page_pt.h>
73#include <genarch/mm/page_ht.h>
[669f3d32]74#include <adt/cht.h>
[9aa72b4]75#include <adt/hash_table.h>
76#include <adt/list.h>
77#include <arch.h>
78#include <align.h>
79#include <panic.h>
80#include <errno.h>
81
82#define FUTEX_HT_SIZE 1024 /* keep it a power of 2 */
83
[669f3d32]84/** Task specific pointer to a global kernel futex object. */
85typedef struct futex_ptr {
86 /** CHT link. */
87 cht_link_t cht_link;
88 /** List of all futex pointers used by the task. */
89 link_t all_link;
90 /** Kernel futex object. */
91 futex_t *futex;
92 /** User space virtual address of the futex variable in the task. */
93 uintptr_t uaddr;
94} futex_ptr_t;
95
96
97static void destroy_task_cache(work_t *work);
98
99static void futex_initialize(futex_t *futex, uintptr_t paddr);
100static void futex_add_ref(futex_t *futex);
101static void futex_release_ref(futex_t *futex);
102static void futex_release_ref_locked(futex_t *futex);
103
104static futex_t *get_futex(uintptr_t uaddr);
105static futex_t *find_cached_futex(uintptr_t uaddr);
106static futex_t *get_and_cache_futex(uintptr_t phys_addr, uintptr_t uaddr);
107static bool find_futex_paddr(uintptr_t uaddr, uintptr_t *phys_addr);
[9aa72b4]108
[96b02eb9]109static size_t futex_ht_hash(sysarg_t *key);
110static bool futex_ht_compare(sysarg_t *key, size_t keys, link_t *item);
[9aa72b4]111static void futex_ht_remove_callback(link_t *item);
112
[669f3d32]113static size_t task_fut_ht_hash(const cht_link_t *link);
114static size_t task_fut_ht_key_hash(void *key);
115static bool task_fut_ht_equal(const cht_link_t *item1, const cht_link_t *item2);
116static bool task_fut_ht_key_equal(void *key, const cht_link_t *item);
117
118
/** Spinlock protecting the global futex hash table.
 *
 * Acquire the task specific TASK->futexes->list_lock before this lock.
 */
[207e8880]123SPINLOCK_STATIC_INITIALIZE_NAME(futex_ht_lock, "futex-ht-lock");
[9aa72b4]124
[669f3d32]125/** Global kernel futex hash table. Lock futex_ht_lock before accessing.
126 *
127 * Physical address of the futex variable is the lookup key.
128 */
[9aa72b4]129static hash_table_t futex_ht;
130
[669f3d32]131/** Global kernel futex hash table operations. */
[9aa72b4]132static hash_table_operations_t futex_ht_ops = {
133 .hash = futex_ht_hash,
134 .compare = futex_ht_compare,
135 .remove_callback = futex_ht_remove_callback
136};
137
[669f3d32]138/** Task futex cache CHT operations. */
139static cht_ops_t task_futex_ht_ops = {
140 .hash = task_fut_ht_hash,
141 .key_hash = task_fut_ht_key_hash,
142 .equal = task_fut_ht_equal,
143 .key_equal = task_fut_ht_key_equal,
144 .remove_callback = NULL
145};
146
[9aa72b4]147/** Initialize futex subsystem. */
148void futex_init(void)
149{
150 hash_table_create(&futex_ht, FUTEX_HT_SIZE, 1, &futex_ht_ops);
151}
152
[669f3d32]153/** Initializes the futex structures for the new task. */
154void futex_task_init(struct task *task)
155{
156 task->futexes = malloc(sizeof(struct futex_cache), 0);
157
[c28413a9]158 cht_create(&task->futexes->ht, 0, 0, 0, true, &task_futex_ht_ops);
[3ac5086]159
160 list_initialize(&task->futexes->list);
[207e8880]161 spinlock_initialize(&task->futexes->list_lock, "futex-list-lock");
[669f3d32]162}
163
164/** Destroys the futex structures for the dying task. */
[3ac5086]165void futex_task_deinit(task_t *task)
[669f3d32]166{
167 /* Interrupts are disabled so we must not block (cannot run cht_destroy). */
168 if (interrupts_disabled()) {
169 /* Invoke the blocking cht_destroy in the background. */
170 workq_global_enqueue_noblock(&task->futexes->destroy_work,
171 destroy_task_cache);
172 } else {
173 /* We can block. Invoke cht_destroy in this thread. */
174 destroy_task_cache(&task->futexes->destroy_work);
175 }
176}
177
178/** Deallocates a task's CHT futex cache (must already be empty). */
179static void destroy_task_cache(work_t *work)
180{
181 struct futex_cache *cache =
182 member_to_inst(work, struct futex_cache, destroy_work);
183
[3ac5086]184 /*
185 * Destroy the cache before manually freeing items of the cache in case
186 * table resize is in progress.
187 */
188 cht_destroy_unsafe(&cache->ht);
189
190 /* Manually free futex_ptr cache items. */
191 list_foreach_safe(cache->list, cur_link, next_link) {
192 futex_ptr_t *fut_ptr = member_to_inst(cur_link, futex_ptr_t, all_link);
193
194 list_remove(cur_link);
195 free(fut_ptr);
196 }
197
[669f3d32]198 free(cache);
199}
200
201/** Remove references from futexes known to the current task. */
202void futex_task_cleanup(void)
203{
[3ac5086]204 struct futex_cache *futexes = TASK->futexes;
205
[669f3d32]206 /* All threads of this task have terminated. This is the last thread. */
[207e8880]207 spinlock_lock(&futexes->list_lock);
[669f3d32]208
[3ac5086]209 list_foreach_safe(futexes->list, cur_link, next_link) {
210 futex_ptr_t *fut_ptr = member_to_inst(cur_link, futex_ptr_t, all_link);
211
[669f3d32]212 /*
213 * The function is free to free the futex. All other threads of this
214 * task have already terminated, so they have also definitely
215 * exited their CHT futex cache protecting rcu reader sections.
216 * Moreover release_ref() only frees the futex if this is the
217 * last task referencing the futex. Therefore, only threads
218 * of this task may have referenced the futex if it is to be freed.
219 */
220 futex_release_ref_locked(fut_ptr->futex);
221 }
222
[207e8880]223 spinlock_unlock(&futexes->list_lock);
[669f3d32]224}
225
226
227/** Initialize the kernel futex structure.
[9aa72b4]228 *
[669f3d32]229 * @param futex Kernel futex structure.
230 * @param paddr Physical address of the futex variable.
[9aa72b4]231 */
[669f3d32]232static void futex_initialize(futex_t *futex, uintptr_t paddr)
[9aa72b4]233{
234 waitq_initialize(&futex->wq);
235 link_initialize(&futex->ht_link);
[669f3d32]236 futex->paddr = paddr;
[4fded58]237 futex->refcount = 1;
[9aa72b4]238}
239
[669f3d32]240/** Increments the counter of tasks referencing the futex. */
241static void futex_add_ref(futex_t *futex)
242{
[207e8880]243 ASSERT(spinlock_locked(&futex_ht_lock));
[669f3d32]244 ASSERT(0 < futex->refcount);
245 ++futex->refcount;
246}
247
248/** Decrements the counter of tasks referencing the futex. May free the futex.*/
249static void futex_release_ref(futex_t *futex)
250{
[207e8880]251 ASSERT(spinlock_locked(&futex_ht_lock));
[669f3d32]252 ASSERT(0 < futex->refcount);
253
254 --futex->refcount;
255
256 if (0 == futex->refcount) {
257 hash_table_remove(&futex_ht, &futex->paddr, 1);
258 }
259}
260
261/** Decrements the counter of tasks referencing the futex. May free the futex.*/
262static void futex_release_ref_locked(futex_t *futex)
263{
[207e8880]264 spinlock_lock(&futex_ht_lock);
[669f3d32]265 futex_release_ref(futex);
[207e8880]266 spinlock_unlock(&futex_ht_lock);
[669f3d32]267}
268
269/** Returns a futex for the virtual address @a uaddr (or creates one). */
270static futex_t *get_futex(uintptr_t uaddr)
271{
272 futex_t *futex = find_cached_futex(uaddr);
273
274 if (futex)
275 return futex;
276
277 uintptr_t paddr;
278
[207e8880]279 if (!find_futex_paddr(uaddr, &paddr)) {
[669f3d32]280 return 0;
[207e8880]281 }
[669f3d32]282
283 return get_and_cache_futex(paddr, uaddr);
284}
285
286
287/** Finds the physical address of the futex variable. */
288static bool find_futex_paddr(uintptr_t uaddr, uintptr_t *paddr)
289{
[207e8880]290 page_table_lock(AS, false);
[759ea0d]291 spinlock_lock(&futex_ht_lock);
[669f3d32]292
[38dc82d]293 bool success = false;
294
295 pte_t t;
296 bool found;
297
298 found = page_mapping_find(AS, ALIGN_DOWN(uaddr, PAGE_SIZE), true, &t);
299 if (found && PTE_VALID(&t) && PTE_PRESENT(&t)) {
300 success = true;
301 *paddr = PTE_GET_FRAME(&t) +
302 (uaddr - ALIGN_DOWN(uaddr, PAGE_SIZE));
[669f3d32]303 }
304
[207e8880]305 spinlock_unlock(&futex_ht_lock);
[759ea0d]306 page_table_unlock(AS, false);
[669f3d32]307
[38dc82d]308 return success;
[669f3d32]309}
310
311/** Returns the futex cached in this task with the virtual address uaddr. */
312static futex_t *find_cached_futex(uintptr_t uaddr)
313{
314 cht_read_lock();
315
316 futex_t *futex;
[c0c26ac]317 cht_link_t *futex_ptr_link = cht_find_lazy(&TASK->futexes->ht, &uaddr);
[669f3d32]318
319 if (futex_ptr_link) {
320 futex_ptr_t *futex_ptr
321 = member_to_inst(futex_ptr_link, futex_ptr_t, cht_link);
322
323 futex = futex_ptr->futex;
324 } else {
325 futex = NULL;
326 }
327
328 cht_read_unlock();
329
330 return futex;
331}
332
333
334/**
335 * Returns a kernel futex for the physical address @a phys_addr and caches
336 * it in this task under the virtual address @a uaddr (if not already cached).
337 */
338static futex_t *get_and_cache_futex(uintptr_t phys_addr, uintptr_t uaddr)
339{
340 futex_t *futex = malloc(sizeof(futex_t), 0);
341
342 /*
343 * Find the futex object in the global futex table (or insert it
344 * if it is not present).
345 */
[207e8880]346 spinlock_lock(&futex_ht_lock);
[669f3d32]347
348 link_t *fut_link = hash_table_find(&futex_ht, &phys_addr);
349
350 if (fut_link) {
351 free(futex);
352 futex = member_to_inst(fut_link, futex_t, ht_link);
353 futex_add_ref(futex);
354 } else {
355 futex_initialize(futex, phys_addr);
356 hash_table_insert(&futex_ht, &phys_addr, &futex->ht_link);
357 }
358
[207e8880]359 spinlock_unlock(&futex_ht_lock);
[669f3d32]360
361 /*
362 * Cache the link to the futex object for this task.
363 */
364 futex_ptr_t *fut_ptr = malloc(sizeof(futex_ptr_t), 0);
365 cht_link_t *dup_link;
366
367 fut_ptr->futex = futex;
368 fut_ptr->uaddr = uaddr;
369
370 cht_read_lock();
371
372 /* Cache the mapping from the virtual address to the futex for this task. */
373 if (cht_insert_unique(&TASK->futexes->ht, &fut_ptr->cht_link, &dup_link)) {
[207e8880]374 spinlock_lock(&TASK->futexes->list_lock);
[3ac5086]375 list_append(&fut_ptr->all_link, &TASK->futexes->list);
[207e8880]376 spinlock_unlock(&TASK->futexes->list_lock);
[669f3d32]377 } else {
378 /* Another thread of this task beat us to it. Use that mapping instead.*/
379 free(fut_ptr);
380 futex_release_ref_locked(futex);
381
382 futex_ptr_t *dup = member_to_inst(dup_link, futex_ptr_t, cht_link);
383 futex = dup->futex;
384 }
385
386 cht_read_unlock();
387
388 return futex;
389}
390
[9aa72b4]391/** Sleep in futex wait queue.
392 *
[4774a32]393 * @param uaddr Userspace address of the futex counter.
[9aa72b4]394 *
[4774a32]395 * @return If there is no physical mapping for uaddr ENOENT is
396 * returned. Otherwise returns a wait result as defined in
397 * synch.h.
[9aa72b4]398 */
[96b02eb9]399sysarg_t sys_futex_sleep(uintptr_t uaddr)
[9aa72b4]400{
[669f3d32]401 futex_t *futex = get_futex(uaddr);
[9aa72b4]402
[669f3d32]403 if (!futex)
[96b02eb9]404 return (sysarg_t) ENOENT;
[741fd16]405
[496232e]406#ifdef CONFIG_UDEBUG
407 udebug_stoppable_begin();
408#endif
409
[669f3d32]410 int rc = waitq_sleep_timeout(&futex->wq, 0, SYNCH_FLAGS_INTERRUPTIBLE);
[207e8880]411
[496232e]412#ifdef CONFIG_UDEBUG
413 udebug_stoppable_end();
414#endif
415
[96b02eb9]416 return (sysarg_t) rc;
[9aa72b4]417}
418
419/** Wakeup one thread waiting in futex wait queue.
420 *
[4774a32]421 * @param uaddr Userspace address of the futex counter.
[9aa72b4]422 *
[4774a32]423 * @return ENOENT if there is no physical mapping for uaddr.
[9aa72b4]424 */
[96b02eb9]425sysarg_t sys_futex_wakeup(uintptr_t uaddr)
[9aa72b4]426{
[669f3d32]427 futex_t *futex = get_futex(uaddr);
[9aa72b4]428
[669f3d32]429 if (futex) {
430 waitq_wakeup(&futex->wq, WAKEUP_FIRST);
431 return 0;
432 } else {
[96b02eb9]433 return (sysarg_t) ENOENT;
[9aa72b4]434 }
[a9ef68b]435}
436
[9aa72b4]437
438/** Compute hash index into futex hash table.
439 *
[4774a32]440 * @param key Address where the key (i.e. physical address of futex
441 * counter) is stored.
[9aa72b4]442 *
[4774a32]443 * @return Index into futex hash table.
[9aa72b4]444 */
[96b02eb9]445size_t futex_ht_hash(sysarg_t *key)
[9aa72b4]446{
[98000fb]447 return (*key & (FUTEX_HT_SIZE - 1));
[9aa72b4]448}
449
450/** Compare futex hash table item with a key.
451 *
[4774a32]452 * @param key Address where the key (i.e. physical address of futex
453 * counter) is stored.
[9aa72b4]454 *
[4774a32]455 * @return True if the item matches the key. False otherwise.
[9aa72b4]456 */
[96b02eb9]457bool futex_ht_compare(sysarg_t *key, size_t keys, link_t *item)
[9aa72b4]458{
459 futex_t *futex;
460
461 ASSERT(keys == 1);
462
463 futex = hash_table_get_instance(item, futex_t, ht_link);
464 return *key == futex->paddr;
465}
466
467/** Callback for removal items from futex hash table.
468 *
[4774a32]469 * @param item Item removed from the hash table.
[9aa72b4]470 */
471void futex_ht_remove_callback(link_t *item)
472{
473 futex_t *futex;
474
475 futex = hash_table_get_instance(item, futex_t, ht_link);
476 free(futex);
477}
[e090e1bc]478
[669f3d32]479/*
480 * Operations of a task's CHT that caches mappings of futex user space
481 * virtual addresses to kernel futex objects.
482 */
483
484static size_t task_fut_ht_hash(const cht_link_t *link)
[e090e1bc]485{
[669f3d32]486 const futex_ptr_t *fut_ptr = member_to_inst(link, futex_ptr_t, cht_link);
487 return fut_ptr->uaddr;
488}
[9c1c6771]489
/** Hash of a lookup key.
 *
 * @param key Pointer to a uintptr_t holding the user space virtual address.
 *
 * @return The address itself, used as the hash value.
 */
static size_t task_fut_ht_key_hash(void *key)
{
	const uintptr_t *uaddr = key;

	return *uaddr;
}
494
495static bool task_fut_ht_equal(const cht_link_t *item1, const cht_link_t *item2)
496{
497 const futex_ptr_t *fut_ptr1 = member_to_inst(item1, futex_ptr_t, cht_link);
498 const futex_ptr_t *fut_ptr2 = member_to_inst(item2, futex_ptr_t, cht_link);
[9c1c6771]499
[669f3d32]500 return fut_ptr1->uaddr == fut_ptr2->uaddr;
[e090e1bc]501}
[b45c443]502
[669f3d32]503static bool task_fut_ht_key_equal(void *key, const cht_link_t *item)
504{
505 const futex_ptr_t *fut_ptr = member_to_inst(item, futex_ptr_t, cht_link);
506 uintptr_t uaddr = *(uintptr_t*)key;
[9c1c6771]507
[669f3d32]508 return fut_ptr->uaddr == uaddr;
[e090e1bc]509}
[b45c443]510
[cc73a8a1]511/** @}
[b45c443]512 */
Note: See TracBrowser for help on using the repository browser.