[glibc.git] / nptl / allocatestack.c
/* Copyright (C) 2002, 2003, 2004 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   Contributed by Ulrich Drepper <drepper@redhat.com>, 2002.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, write to the Free
   Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
   02111-1307 USA.  */
#include <assert.h>
#include <errno.h>
#include <stdint.h>
#include <string.h>
#include <unistd.h>
#include <sys/mman.h>
#include <sys/param.h>
#include <dl-sysdep.h>
#include <tls.h>
#include <lowlevellock.h>	/* For lll_lock/lll_unlock and
				   LLL_LOCK_INITIALIZER used below.  */
#ifndef NEED_SEPARATE_REGISTER_STACK

/* Most architectures have exactly one stack pointer.  Some have more.  */
# define STACK_VARIABLES void *stackaddr

/* How to pass the values to the 'create_thread' function.  */
# define STACK_VARIABLES_ARGS stackaddr

/* How to declare the function which gets these parameters.  */
# define STACK_VARIABLES_PARMS void *stackaddr

/* How to declare allocate_stack.  */
# define ALLOCATE_STACK_PARMS void **stack

/* This is how the function is called.  We do it this way to allow
   other variants of the function to have more parameters.  */
# define ALLOCATE_STACK(attr, pd) allocate_stack (attr, pd, &stackaddr)

#else

/* We need two stacks.  The kernel will place them but we have to tell
   the kernel about the size of the reserved address space.  */
# define STACK_VARIABLES void *stackaddr; size_t stacksize

/* How to pass the values to the 'create_thread' function.  */
# define STACK_VARIABLES_ARGS stackaddr, stacksize

/* How to declare the function which gets these parameters.  */
# define STACK_VARIABLES_PARMS void *stackaddr, size_t stacksize

/* How to declare allocate_stack.  */
# define ALLOCATE_STACK_PARMS void **stack, size_t *stacksize

/* This is how the function is called.  We do it this way to allow
   other variants of the function to have more parameters.  */
# define ALLOCATE_STACK(attr, pd) \
  allocate_stack (attr, pd, &stackaddr, &stacksize)

#endif
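
/* Editor's sketch (not part of the original file): roughly how a
   caller such as create_thread in pthread_create.c is expected to use
   these macros.  The function name example_create_thread is
   hypothetical; only the macro names come from this file.  */
#if 0 /* illustration only */
static int
example_create_thread (const struct pthread_attr *attr)
{
  struct pthread *pd;
  STACK_VARIABLES;	/* void *stackaddr (plus size_t stacksize when
			   NEED_SEPARATE_REGISTER_STACK is defined).  */

  /* Expands to allocate_stack (attr, &pd, &stackaddr) or, with two
     stacks, allocate_stack (attr, &pd, &stackaddr, &stacksize).  */
  int err = ALLOCATE_STACK (attr, &pd);
  if (err != 0)
    return err;

  /* The values are then forwarded unchanged, e.g.:
       create_thread (pd, attr, STACK_VARIABLES_ARGS);  */
  return 0;
}
#endif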
/* Default alignment of stack.  */
#ifndef STACK_ALIGN
# define STACK_ALIGN __alignof__ (long double)
#endif

/* Default value for minimal stack size after allocating thread
   descriptor and guard.  */
#ifndef MINIMAL_REST_STACK
# define MINIMAL_REST_STACK 4096
#endif

/* Let the architecture add some flags to the mmap() call used to
   allocate stacks.  */
#ifndef ARCH_MAP_FLAGS
# define ARCH_MAP_FLAGS 0
#endif
/* This yields the pointer that TLS support code calls the thread pointer.  */
#if TLS_TCB_AT_TP
# define TLS_TPADJ(pd) (pd)
#elif TLS_DTV_AT_TP
# define TLS_TPADJ(pd) ((struct pthread *)((char *) (pd) + TLS_PRE_TCB_SIZE))
#endif
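
/* Editor's note: with TLS_TCB_AT_TP the descriptor itself is the TCB
   the thread pointer designates, so no adjustment is needed.  With
   TLS_DTV_AT_TP the TCB sits TLS_PRE_TCB_SIZE bytes above the
   descriptor, so TLS_TPADJ moves PD up to the address the TLS support
   code expects.  */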
/* Cache handling for not-yet-freed stacks.  */

/* Maximum size of the cache, in bytes.  */
static size_t stack_cache_maxsize = 40 * 1024 * 1024; /* 40 MiB by default.  */
static size_t stack_cache_actsize;

/* Mutex protecting the stack cache and the lists of stacks.  */
static lll_lock_t stack_cache_lock = LLL_LOCK_INITIALIZER;

/* List of queued stack frames.  */
static LIST_HEAD (stack_cache);

/* List of the stacks in use.  */
static LIST_HEAD (stack_used);

/* List of the threads with user provided stacks in use.  No need to
   initialize this, since it's done in __pthread_initialize_minimal.  */
list_t __stack_user __attribute__ ((nocommon));
hidden_data_def (__stack_user)

#if COLORING_INCREMENT != 0
/* Number of threads created.  */
static unsigned int nptl_ncreated;
#endif
/* Check whether the stack is still used or not.  */
#define FREE_P(descr) ((descr)->tid <= 0)


/* We create a doubly linked list of all cache entries.  Doubly linked
   because this allows removing entries from the end.  */
/* Get a stack frame from the cache.  We have to match by size since
   some blocks might be too small or far too large.  */
static struct pthread *
get_cached_stack (size_t *sizep, void **memp)
{
  size_t size = *sizep;
  struct pthread *result = NULL;
  list_t *entry;

  lll_lock (stack_cache_lock);

  /* Search the cache for a matching entry.  We search for the
     smallest stack which has at least the required size.  Note that
     in normal situations the size of all allocated stacks is the
     same.  At the very least there are only a few different sizes.
     Therefore this loop will exit early most of the time with an
     exact match.  */
  list_for_each (entry, &stack_cache)
    {
      struct pthread *curr;

      curr = list_entry (entry, struct pthread, list);
      if (FREE_P (curr) && curr->stackblock_size >= size)
        {
          if (curr->stackblock_size == size)
            {
              result = curr;
              break;
            }

          if (result == NULL
              || result->stackblock_size > curr->stackblock_size)
            result = curr;
        }
    }

  if (__builtin_expect (result == NULL, 0)
      /* Make sure the size difference is not too excessive.  In that
         case we do not use the block.  */
      || __builtin_expect (result->stackblock_size > 4 * size, 0))
    {
      /* Release the lock.  */
      lll_unlock (stack_cache_lock);

      return NULL;
    }

  /* Dequeue the entry.  */
  list_del (&result->list);

  /* And add to the list of stacks in use.  */
  list_add (&result->list, &stack_used);

  /* And decrease the cache size.  */
  stack_cache_actsize -= result->stackblock_size;

  /* Release the lock early.  */
  lll_unlock (stack_cache_lock);

  /* Report size and location of the stack to the caller.  */
  *sizep = result->stackblock_size;
  *memp = result->stackblock;

  /* Cancellation handling is back to the default.  */
  result->cancelhandling = 0;
  result->cleanup = NULL;

  /* No pending event.  */
  result->nextevent = NULL;

  /* Clear the DTV.  */
  dtv_t *dtv = GET_DTV (TLS_TPADJ (result));
  memset (dtv, '\0', (dtv[-1].counter + 1) * sizeof (dtv_t));

  /* Re-initialize the TLS.  */
  _dl_allocate_tls_init (TLS_TPADJ (result));

  return result;
}
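
/* Editor's note: allocate_stack below uses this as

     reqsize = size;
     pd = get_cached_stack (&size, &mem);

   On a hit, SIZE and MEM describe the (possibly larger) recycled block
   and the returned descriptor already has a cleared DTV and freshly
   initialized static TLS; on a miss, NULL is returned and the caller
   falls back to mmap.  */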
/* Add a stack frame which is not used anymore to the stack cache.
   Must be called with the cache lock held.  */
static inline void
__attribute ((always_inline))
queue_stack (struct pthread *stack)
{
  /* We unconditionally add the stack to the list.  The memory may
     still be in use but it will not be reused until the kernel marks
     the stack as not used anymore.  */
  list_add (&stack->list, &stack_cache);

  stack_cache_actsize += stack->stackblock_size;
  if (__builtin_expect (stack_cache_actsize > stack_cache_maxsize, 0))
    {
      /* We reduce the size of the cache.  Remove the last entries
         until the size is below the limit.  */
      list_t *entry;
      list_t *prev;

      /* Search from the end of the list.  */
      list_for_each_prev_safe (entry, prev, &stack_cache)
        {
          struct pthread *curr;

          curr = list_entry (entry, struct pthread, list);
          if (FREE_P (curr))
            {
              /* Unlink the block.  */
              list_del (entry);

              /* Account for the freed memory.  */
              stack_cache_actsize -= curr->stackblock_size;

              /* Free the memory associated with the ELF TLS.  */
              _dl_deallocate_tls (TLS_TPADJ (curr), false);

              /* Remove this block.  This should never fail.  If it
                 does something is really wrong.  */
              if (munmap (curr->stackblock, curr->stackblock_size) != 0)
                abort ();

              /* Maybe we have freed enough.  */
              if (stack_cache_actsize <= stack_cache_maxsize)
                break;
            }
        }
    }
}
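
/* Editor's example (hypothetical numbers): with the default 40 MiB
   limit and 8 MiB stacks, queueing a sixth free stack raises
   stack_cache_actsize to 48 MiB; the loop above then munmaps blocks
   from the tail of the list until the total is back at or below the
   40 MiB limit.  */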
static int
internal_function
change_stack_perm (struct pthread *pd
#ifdef NEED_SEPARATE_REGISTER_STACK
                   , size_t pagemask
#endif
                   )
{
#ifdef NEED_SEPARATE_REGISTER_STACK
  void *stack = (pd->stackblock
                 + (((((pd->stackblock_size - pd->guardsize) / 2)
                      & pagemask) + pd->guardsize) & pagemask));
  size_t len = pd->stackblock + pd->stackblock_size - stack;
#else
  void *stack = pd->stackblock + pd->guardsize;
  size_t len = pd->stackblock_size - pd->guardsize;
#endif
  if (mprotect (stack, len, PROT_READ | PROT_WRITE | PROT_EXEC) != 0)
    return errno;

  return 0;
}
static int
allocate_stack (const struct pthread_attr *attr, struct pthread **pdp,
                ALLOCATE_STACK_PARMS)
{
  struct pthread *pd;
  size_t size;
  size_t pagesize_m1 = __getpagesize () - 1;
  void *stacktop;

  assert (attr != NULL);
  assert (powerof2 (pagesize_m1 + 1));
  assert (TCB_ALIGNMENT >= STACK_ALIGN);

  /* Get the stack size from the attribute if it is set.  Otherwise we
     use the default we determined at start time.  */
  size = attr->stacksize ?: __default_stacksize;

  /* Get memory for the stack.  */
  if (__builtin_expect (attr->flags & ATTR_FLAG_STACKADDR, 0))
    {
      uintptr_t adj;

      /* If the user also specified the size of the stack make sure it
         is large enough.  */
      if (attr->stacksize != 0
          && attr->stacksize < (__static_tls_size + MINIMAL_REST_STACK))
        return EINVAL;

      /* Adjust stack size for alignment of the TLS block.  */
#if TLS_TCB_AT_TP
      adj = ((uintptr_t) attr->stackaddr - TLS_TCB_SIZE)
            & __static_tls_align_m1;
      assert (size > adj + TLS_TCB_SIZE);
#elif TLS_DTV_AT_TP
      adj = ((uintptr_t) attr->stackaddr - __static_tls_size)
            & __static_tls_align_m1;
      assert (size > adj);
#endif
      /* The user provided some memory.  Let's hope it matches the
         size...  We do not allocate guard pages if the user provided
         the stack.  It is the user's responsibility to do this if it
         is wanted.  */
#if TLS_TCB_AT_TP
      pd = (struct pthread *) ((uintptr_t) attr->stackaddr
                               - TLS_TCB_SIZE - adj);
#elif TLS_DTV_AT_TP
      pd = (struct pthread *) (((uintptr_t) attr->stackaddr
                                - __static_tls_size - adj)
                               - TLS_PRE_TCB_SIZE);
#endif

      /* The user provided stack memory needs to be cleared.  */
      memset (pd, '\0', sizeof (struct pthread));

      /* The first TSD block is included in the TCB.  */
      pd->specific[0] = pd->specific_1stblock;

#if defined __ASSUME_CLONE_STOPPED && LLL_LOCK_INITIALIZER != 0
      /* Initialize the lock.  */
      pd->lock = LLL_LOCK_INITIALIZER;
#endif

      /* Remember the stack-related values.  */
      pd->stackblock = (char *) attr->stackaddr - size;
      pd->stackblock_size = size;

      /* This is a user-provided stack.  It will not be queued in the
         stack cache nor will the memory (except the TLS memory) be freed.  */
      pd->user_stack = true;

      /* This is at least the second thread.  */
      pd->header.multiple_threads = 1;
#ifndef TLS_MULTIPLE_THREADS_IN_TCB
      __pthread_multiple_threads = *__libc_multiple_threads_ptr = 1;
#endif

#ifdef NEED_DL_SYSINFO
      /* Copy the sysinfo value from the parent.  */
      THREAD_SYSINFO(pd) = THREAD_SELF_SYSINFO;
#endif

      /* The process ID is also the same as that of the caller.  */
      pd->pid = THREAD_GETMEM (THREAD_SELF, pid);

      /* Allocate the DTV for this thread.  */
      if (_dl_allocate_tls (TLS_TPADJ (pd)) == NULL)
        /* Something went wrong.  */
        return errno;

      /* Prepare to modify global data.  */
      lll_lock (stack_cache_lock);

      /* And add to the list of stacks in use.  */
      list_add (&pd->list, &__stack_user);

      lll_unlock (stack_cache_lock);
    }
  else
    {
      /* Allocate some anonymous memory.  If possible use the cache.  */
      size_t guardsize;
      size_t reqsize;
      void *mem;
      const int prot = (PROT_READ | PROT_WRITE
                        | ((GL(dl_stack_flags) & PF_X) ? PROT_EXEC : 0));

#if COLORING_INCREMENT != 0
      /* Add one more page for stack coloring.  Don't do it for stacks
         with 16 times pagesize or larger.  This might just cause
         unnecessary misalignment.  */
      if (size <= 16 * pagesize_m1)
        size += pagesize_m1 + 1;
#endif

      /* Adjust the stack size for alignment.  */
      size &= ~__static_tls_align_m1;
      assert (size != 0);

      /* Make sure the size of the stack is enough for the guard and
         possibly the thread descriptor.  */
      guardsize = (attr->guardsize + pagesize_m1) & ~pagesize_m1;
      if (__builtin_expect (size < (guardsize + __static_tls_size
                                    + MINIMAL_REST_STACK + pagesize_m1 + 1),
                            0))
        /* The stack is too small (or the guard too large).  */
        return EINVAL;
      /* Try to get a stack from the cache.  */
      reqsize = size;
      pd = get_cached_stack (&size, &mem);
      if (pd == NULL)
        {
          /* To avoid aliasing effects on a larger scale than pages we
             adjust the allocated stack size if necessary.  This way
             allocations directly following each other will not have
             aliasing problems.  */
#if MULTI_PAGE_ALIASING != 0
          if ((size % MULTI_PAGE_ALIASING) == 0)
            size += pagesize_m1 + 1;
#endif

          mem = mmap (NULL, size, prot,
                      MAP_PRIVATE | MAP_ANONYMOUS | ARCH_MAP_FLAGS, -1, 0);

          if (__builtin_expect (mem == MAP_FAILED, 0))
            {
#ifdef ARCH_RETRY_MMAP
              mem = ARCH_RETRY_MMAP (size);
              if (__builtin_expect (mem == MAP_FAILED, 0))
#endif
                return errno;
            }

          /* SIZE is guaranteed to be greater than zero.
             So we can never get a null pointer back from mmap.  */
          assert (mem != NULL);
#if COLORING_INCREMENT != 0
          /* Atomically increment NCREATED.  */
          unsigned int ncreated = atomic_increment_val (&nptl_ncreated);

          /* We choose the offset for coloring by incrementing it for
             every new thread by a fixed amount.  The offset is used
             modulo the page size.  Even if coloring would be better
             relative to higher alignment values it makes no sense to
             do it since the mmap() interface does not allow us to
             specify any alignment for the returned memory block.  */
          size_t coloring = (ncreated * COLORING_INCREMENT) & pagesize_m1;

          /* Make sure the coloring offset does not disturb the alignment
             of the TCB and static TLS block.  */
          if (__builtin_expect ((coloring & __static_tls_align_m1) != 0, 0))
            coloring = (((coloring + __static_tls_align_m1)
                         & ~(__static_tls_align_m1))
                        & ~pagesize_m1);
#else
          /* Unless specified we do not make any adjustments.  */
# define coloring 0
#endif
          /* Place the thread descriptor at the end of the stack.  */
#if TLS_TCB_AT_TP
          pd = (struct pthread *) ((char *) mem + size - coloring) - 1;
#elif TLS_DTV_AT_TP
          pd = (struct pthread *) ((((uintptr_t) mem + size - coloring
                                     - __static_tls_size)
                                    & ~__static_tls_align_m1)
                                   - TLS_PRE_TCB_SIZE);
#endif

          /* Remember the stack-related values.  */
          pd->stackblock = mem;
          pd->stackblock_size = size;

          /* We allocated the first block of the thread-specific data
             array.  This address will not change for the lifetime of
             this descriptor.  */
          pd->specific[0] = pd->specific_1stblock;

#if defined __ASSUME_CLONE_STOPPED && LLL_LOCK_INITIALIZER != 0
          /* Initialize the lock.  */
          pd->lock = LLL_LOCK_INITIALIZER;
#endif

          /* This is at least the second thread.  */
          pd->header.multiple_threads = 1;
#ifndef TLS_MULTIPLE_THREADS_IN_TCB
          __pthread_multiple_threads = *__libc_multiple_threads_ptr = 1;
#endif

#ifdef NEED_DL_SYSINFO
          /* Copy the sysinfo value from the parent.  */
          THREAD_SYSINFO(pd) = THREAD_SELF_SYSINFO;
#endif

          /* The process ID is also the same as that of the caller.  */
          pd->pid = THREAD_GETMEM (THREAD_SELF, pid);

          /* Allocate the DTV for this thread.  */
          if (_dl_allocate_tls (TLS_TPADJ (pd)) == NULL)
            {
              /* Something went wrong.  */
              int err = errno;

              /* Free the stack memory we just allocated.  */
              (void) munmap (mem, size);

              return err;
            }
          /* Prepare to modify global data.  */
          lll_lock (stack_cache_lock);

          /* And add to the list of stacks in use.  */
          list_add (&pd->list, &stack_used);

          lll_unlock (stack_cache_lock);

          /* There might have been a race.  Another thread might have
             caused the stacks to get exec permission while this new
             stack was prepared.  Detect if this was possible and
             change the permission if necessary.  */
          if (__builtin_expect ((GL(dl_stack_flags) & PF_X) != 0
                                && (prot & PROT_EXEC) == 0, 0))
            {
              int err = change_stack_perm (pd
#ifdef NEED_SEPARATE_REGISTER_STACK
                                           , ~pagesize_m1
#endif
                                           );
              if (err != 0)
                {
                  /* Free the stack memory we just allocated.  */
                  (void) munmap (mem, size);

                  return err;
                }
            }

          /* Note that all of the stack and the thread descriptor is
             zeroed.  This means we do not have to initialize fields
             with initial value zero.  This is specifically true for
             the 'tid' field which is always set back to zero once the
             stack is not used anymore and for the 'guardsize' field
             which will be read next.  */
        }
      /* Create or resize the guard area if necessary.  */
      if (__builtin_expect (guardsize > pd->guardsize, 0))
        {
#ifdef NEED_SEPARATE_REGISTER_STACK
          char *guard = mem + (((size - guardsize) / 2) & ~pagesize_m1);
#else
          char *guard = mem;
#endif
          if (mprotect (guard, guardsize, PROT_NONE) != 0)
            {
              int err;
            mprot_error:
              err = errno;

              lll_lock (stack_cache_lock);

              /* Remove the thread from the list.  */
              list_del (&pd->list);

              lll_unlock (stack_cache_lock);

              /* Get rid of the TLS block we allocated.  */
              _dl_deallocate_tls (TLS_TPADJ (pd), false);

              /* Free the stack memory regardless of whether the size
                 of the cache is over the limit or not.  If this piece
                 of memory caused problems we better do not use it
                 anymore.  Uh, and we ignore possible errors.  There
                 is nothing we could do.  */
              (void) munmap (mem, size);

              return err;
            }
          pd->guardsize = guardsize;
        }
      else if (__builtin_expect (pd->guardsize - guardsize > size - reqsize,
                                 0))
        {
          /* The old guard area is too large.  */

#ifdef NEED_SEPARATE_REGISTER_STACK
          char *guard = mem + (((size - guardsize) / 2) & ~pagesize_m1);
          char *oldguard = mem + (((size - pd->guardsize) / 2) & ~pagesize_m1);

          if (oldguard < guard
              && mprotect (oldguard, guard - oldguard, prot) != 0)
            goto mprot_error;

          if (mprotect (guard + guardsize,
                        oldguard + pd->guardsize - guard - guardsize,
                        prot) != 0)
            goto mprot_error;
#else
          if (mprotect ((char *) mem + guardsize, pd->guardsize - guardsize,
                        prot) != 0)
            goto mprot_error;
#endif

          pd->guardsize = guardsize;
        }

      /* The pthread_getattr_np() calls need to get passed the size
         requested in the attribute, regardless of how large the
         actually used guardsize is.  */
      pd->reported_guardsize = guardsize;
    }
#ifndef __ASSUME_CLONE_STOPPED
  /* Initialize the lock.  We have to do this unconditionally if the
     CLONE_STOPPED flag is not available since then the stillborn
     thread could be canceled while the lock is taken.  */
  pd->lock = LLL_LOCK_INITIALIZER;
#endif

  /* We place the thread descriptor at the end of the stack.  */
  *pdp = pd;

#if TLS_TCB_AT_TP
  /* The stack begins before the TCB and the static TLS block.  */
  stacktop = ((char *) (pd + 1) - __static_tls_size);
#elif TLS_DTV_AT_TP
  stacktop = (char *) (pd - 1);
#endif

#ifdef NEED_SEPARATE_REGISTER_STACK
  *stack = pd->stackblock;
  *stacksize = stacktop - *stack;
#else
  *stack = stacktop;
#endif

  return 0;
}
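
/* Editor's summary of the contract: on success allocate_stack returns
   zero, stores the new descriptor in *PDP and reports the usable stack
   through the ALLOCATE_STACK_PARMS out parameters; on failure it
   returns an errno value (EINVAL for unusable sizes, otherwise the
   mmap/mprotect/TLS error) after releasing any memory it allocated
   itself.  */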
void
internal_function
__deallocate_stack (struct pthread *pd)
{
  lll_lock (stack_cache_lock);

  /* Remove the thread from the list of threads with user defined
     stacks.  */
  list_del (&pd->list);

  /* Not much to do.  Just free the mmap()ed memory.  Note that we do
     not reset the 'used' flag in the 'tid' field.  This is done by
     the kernel.  If no thread has been created yet this field is
     still zero.  */
  if (__builtin_expect (! pd->user_stack, 1))
    (void) queue_stack (pd);
  else
    /* Free the memory associated with the ELF TLS.  */
    _dl_deallocate_tls (TLS_TPADJ (pd), false);

  lll_unlock (stack_cache_lock);
}
int
internal_function
__make_stacks_executable (void **stack_endp)
{
  /* First the main thread's stack.  */
  int err = _dl_make_stack_executable (stack_endp);
  if (err != 0)
    return err;

#ifdef NEED_SEPARATE_REGISTER_STACK
  const size_t pagemask = ~(__getpagesize () - 1);
#endif

  lll_lock (stack_cache_lock);

  list_t *runp;
  list_for_each (runp, &stack_used)
    {
      err = change_stack_perm (list_entry (runp, struct pthread, list)
#ifdef NEED_SEPARATE_REGISTER_STACK
                               , pagemask
#endif
                               );
      if (err != 0)
        break;
    }

  /* Also change the permission for the currently unused stacks.  This
     might be wasted time but better spend it here than adding a check
     in the fast path.  */
  if (err == 0)
    list_for_each (runp, &stack_cache)
      {
        err = change_stack_perm (list_entry (runp, struct pthread, list)
#ifdef NEED_SEPARATE_REGISTER_STACK
                                 , pagemask
#endif
                                 );
        if (err != 0)
          break;
      }

  lll_unlock (stack_cache_lock);

  return err;
}
/* In case of a fork() call the memory allocation in the child will be
   the same but only one thread is running.  All stacks except that of
   the one running thread are not used anymore.  We have to recycle
   them.  */
void
__reclaim_stacks (void)
{
  struct pthread *self = (struct pthread *) THREAD_SELF;

  /* No locking necessary.  The caller's thread is the only one running.  */

  /* Mark all stacks except the still running one as free.  */
  list_t *runp;
  list_for_each (runp, &stack_used)
    {
      struct pthread *curp;

      curp = list_entry (runp, struct pthread, list);
      if (curp != self)
        {
          /* This marks the stack as free.  */
          curp->tid = 0;

          /* The PID field must be initialized for the new process.  */
          curp->pid = self->pid;

          /* Account for the size of the stack.  */
          stack_cache_actsize += curp->stackblock_size;
        }
    }

  /* Add the stacks of all running threads to the cache.  */
  list_splice (&stack_used, &stack_cache);

  /* Remove the entry for the current thread from the cache list
     and add it to the list of running threads.  Which of the two
     lists is decided by the user_stack flag.  */
  list_del (&self->list);

  /* Re-initialize the lists for all the threads.  */
  INIT_LIST_HEAD (&stack_used);
  INIT_LIST_HEAD (&__stack_user);

  if (__builtin_expect (THREAD_GETMEM (self, user_stack), 0))
    list_add (&self->list, &__stack_user);
  else
    list_add (&self->list, &stack_used);

  /* There is one thread running.  */
  __nptl_nthreads = 1;

  /* Initialize the lock.  */
  stack_cache_lock = LLL_LOCK_INITIALIZER;
}
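
/* Editor's note: this runs in the child after fork, where exactly one
   thread survives; that is why no locking is needed here and why the
   lock is simply reset to its initial state.  */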
#if HP_TIMING_AVAIL
/* Find a thread given the thread ID.  */
struct pthread *
attribute_hidden
__find_thread_by_id (pid_t tid)
{
  struct pthread *result = NULL;

  lll_lock (stack_cache_lock);

  /* Iterate over the list with system-allocated threads first.  */
  list_t *runp;
  list_for_each (runp, &stack_used)
    {
      struct pthread *curp;

      curp = list_entry (runp, struct pthread, list);

      if (curp->tid == tid)
        {
          result = curp;
          goto out;
        }
    }

  /* Now the list with threads using user-allocated stacks.  */
  list_for_each (runp, &__stack_user)
    {
      struct pthread *curp;

      curp = list_entry (runp, struct pthread, list);

      if (curp->tid == tid)
        {
          result = curp;
          goto out;
        }
    }

 out:
  lll_unlock (stack_cache_lock);

  return result;
}
#endif
static inline void __attribute__((always_inline))
init_one_static_tls (struct pthread *curp, struct link_map *map)
{
  dtv_t *dtv = GET_DTV (TLS_TPADJ (curp));
# if TLS_TCB_AT_TP
  void *dest = (char *) curp - map->l_tls_offset;
# elif TLS_DTV_AT_TP
  void *dest = (char *) curp + map->l_tls_offset + TLS_PRE_TCB_SIZE;
# else
#  error "Either TLS_TCB_AT_TP or TLS_DTV_AT_TP must be defined"
# endif

  /* Fill in the DTV slot so that a later LD/GD access will find it.  */
  dtv[map->l_tls_modid].pointer = dest;

  /* Initialize the memory.  */
  memset (__mempcpy (dest, map->l_tls_initimage, map->l_tls_initimage_size),
          '\0', map->l_tls_blocksize - map->l_tls_initimage_size);
}
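
/* Editor's note: __mempcpy returns DEST + l_tls_initimage_size, so the
   memset above zero-fills exactly the tail of the block, i.e. the part
   corresponding to .tbss which has no initialization image.  E.g. an
   8-byte init image in a 32-byte block leaves bytes 8..31 to clear.  */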
void
attribute_hidden
__pthread_init_static_tls (struct link_map *map)
{
  lll_lock (stack_cache_lock);

  /* Iterate over the list with system-allocated threads first.  */
  list_t *runp;
  list_for_each (runp, &stack_used)
    init_one_static_tls (list_entry (runp, struct pthread, list), map);

  /* Now the list with threads using user-allocated stacks.  */
  list_for_each (runp, &__stack_user)
    init_one_static_tls (list_entry (runp, struct pthread, list), map);

  lll_unlock (stack_cache_lock);
}