(CFLAGS-tst-align.c): Add -mpreferred-stack-boundary=4.
[glibc.git] / malloc / malloc.c
blobe3ccbde7b5b84affbf6ff2387a5151310235f0a3
1 /* Malloc implementation for multiple threads without lock contention.
2 Copyright (C) 1996-2002, 2003, 2004 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Wolfram Gloger <wg@malloc.de>
5 and Doug Lea <dl@cs.oswego.edu>, 2001.
7 The GNU C Library is free software; you can redistribute it and/or
8 modify it under the terms of the GNU Lesser General Public License as
9 published by the Free Software Foundation; either version 2.1 of the
10 License, or (at your option) any later version.
12 The GNU C Library is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 Lesser General Public License for more details.
17 You should have received a copy of the GNU Lesser General Public
18 License along with the GNU C Library; see the file COPYING.LIB. If not,
19 write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA. */
23 This is a version (aka ptmalloc2) of malloc/free/realloc written by
24 Doug Lea and adapted to multiple threads/arenas by Wolfram Gloger.
26 * Version ptmalloc2-20011215
27 $Id$
28 based on:
29 VERSION 2.7.0 Sun Mar 11 14:14:06 2001 Doug Lea (dl at gee)
31 Note: There may be an updated version of this malloc obtainable at
32 http://www.malloc.de/malloc/ptmalloc2.tar.gz
33 Check before installing!
35 * Quickstart
37 In order to compile this implementation, a Makefile is provided with
38 the ptmalloc2 distribution, which has pre-defined targets for some
39 popular systems (e.g. "make posix" for Posix threads). All that is
40 typically required with regard to compiler flags is the selection of
41 the thread package via defining one out of USE_PTHREADS, USE_THR or
42 USE_SPROC. Check the thread-m.h file for what effects this has.
43 Many/most systems will additionally require USE_TSD_DATA_HACK to be
44 defined, so this is the default for "make posix".
46 * Why use this malloc?
48 This is not the fastest, most space-conserving, most portable, or
49 most tunable malloc ever written. However it is among the fastest
50 while also being among the most space-conserving, portable and tunable.
51 Consistent balance across these factors results in a good general-purpose
52 allocator for malloc-intensive programs.
54 The main properties of the algorithms are:
55 * For large (>= 512 bytes) requests, it is a pure best-fit allocator,
56 with ties normally decided via FIFO (i.e. least recently used).
57 * For small (<= 64 bytes by default) requests, it is a caching
58 allocator, that maintains pools of quickly recycled chunks.
59 * In between, and for combinations of large and small requests, it does
60 the best it can trying to meet both goals at once.
61 * For very large requests (>= 128KB by default), it relies on system
62 memory mapping facilities, if supported.
64 For a longer but slightly out of date high-level description, see
65 http://gee.cs.oswego.edu/dl/html/malloc.html
67 You may already by default be using a C library containing a malloc
68 that is based on some version of this malloc (for example in
69 linux). You might still want to use the one in this file in order to
70 customize settings or to avoid overheads associated with library
71 versions.
73 * Contents, described in more detail in "description of public routines" below.
75 Standard (ANSI/SVID/...) functions:
76 malloc(size_t n);
77 calloc(size_t n_elements, size_t element_size);
78 free(Void_t* p);
79 realloc(Void_t* p, size_t n);
80 memalign(size_t alignment, size_t n);
81 valloc(size_t n);
82 mallinfo()
83 mallopt(int parameter_number, int parameter_value)
85 Additional functions:
86 independent_calloc(size_t n_elements, size_t size, Void_t* chunks[]);
87 independent_comalloc(size_t n_elements, size_t sizes[], Void_t* chunks[]);
88 pvalloc(size_t n);
89 cfree(Void_t* p);
90 malloc_trim(size_t pad);
91 malloc_usable_size(Void_t* p);
92 malloc_stats();
94 * Vital statistics:
96 Supported pointer representation: 4 or 8 bytes
97 Supported size_t representation: 4 or 8 bytes
98 Note that size_t is allowed to be 4 bytes even if pointers are 8.
99 You can adjust this by defining INTERNAL_SIZE_T
101 Alignment: 2 * sizeof(size_t) (default)
102 (i.e., 8 byte alignment with 4byte size_t). This suffices for
103 nearly all current machines and C compilers. However, you can
104 define MALLOC_ALIGNMENT to be wider than this if necessary.
106 Minimum overhead per allocated chunk: 4 or 8 bytes
107 Each malloced chunk has a hidden word of overhead holding size
108 and status information.
110 Minimum allocated size: 4-byte ptrs: 16 bytes (including 4 overhead)
111 8-byte ptrs: 24/32 bytes (including, 4/8 overhead)
113 When a chunk is freed, 12 (for 4byte ptrs) or 20 (for 8 byte
114 ptrs but 4 byte size) or 24 (for 8/8) additional bytes are
115 needed; 4 (8) for a trailing size field and 8 (16) bytes for
116 free list pointers. Thus, the minimum allocatable size is
117 16/24/32 bytes.
119 Even a request for zero bytes (i.e., malloc(0)) returns a
120 pointer to something of the minimum allocatable size.
122 The maximum overhead wastage (i.e., number of extra bytes
123 allocated than were requested in malloc) is less than or equal
124 to the minimum size, except for requests >= mmap_threshold that
125 are serviced via mmap(), where the worst case wastage is 2 *
126 sizeof(size_t) bytes plus the remainder from a system page (the
127 minimal mmap unit); typically 4096 or 8192 bytes.
129 Maximum allocated size: 4-byte size_t: 2^32 minus about two pages
130 8-byte size_t: 2^64 minus about two pages
132 It is assumed that (possibly signed) size_t values suffice to
133 represent chunk sizes. `Possibly signed' is due to the fact
134 that `size_t' may be defined on a system as either a signed or
135 an unsigned type. The ISO C standard says that it must be
136 unsigned, but a few systems are known not to adhere to this.
137 Additionally, even when size_t is unsigned, sbrk (which is by
138 default used to obtain memory from system) accepts signed
139 arguments, and may not be able to handle size_t-wide arguments
140 with negative sign bit. Generally, values that would
141 appear as negative after accounting for overhead and alignment
142 are supported only via mmap(), which does not have this
143 limitation.
145 Requests for sizes outside the allowed range will perform an optional
146 failure action and then return null. (Requests may also
147 also fail because a system is out of memory.)
149 Thread-safety: thread-safe unless NO_THREADS is defined
151 Compliance: I believe it is compliant with the 1997 Single Unix Specification
152 (See http://www.opennc.org). Also SVID/XPG, ANSI C, and probably
153 others as well.
155 * Synopsis of compile-time options:
157 People have reported using previous versions of this malloc on all
158 versions of Unix, sometimes by tweaking some of the defines
159 below. It has been tested most extensively on Solaris and
160 Linux. It is also reported to work on WIN32 platforms.
161 People also report using it in stand-alone embedded systems.
163 The implementation is in straight, hand-tuned ANSI C. It is not
164 at all modular. (Sorry!) It uses a lot of macros. To be at all
165 usable, this code should be compiled using an optimizing compiler
166 (for example gcc -O3) that can simplify expressions and control
167 paths. (FAQ: some macros import variables as arguments rather than
168 declare locals because people reported that some debuggers
169 otherwise get confused.)
171 OPTION DEFAULT VALUE
173 Compilation Environment options:
175 __STD_C derived from C compiler defines
176 WIN32 NOT defined
177 HAVE_MEMCPY defined
178 USE_MEMCPY 1 if HAVE_MEMCPY is defined
179 HAVE_MMAP defined as 1
180 MMAP_CLEARS 1
181 HAVE_MREMAP 0 unless linux defined
182 USE_ARENAS the same as HAVE_MMAP
183 malloc_getpagesize derived from system #includes, or 4096 if not
184 HAVE_USR_INCLUDE_MALLOC_H NOT defined
185 LACKS_UNISTD_H NOT defined unless WIN32
186 LACKS_SYS_PARAM_H NOT defined unless WIN32
187 LACKS_SYS_MMAN_H NOT defined unless WIN32
189 Changing default word sizes:
191 INTERNAL_SIZE_T size_t
192 MALLOC_ALIGNMENT 2 * sizeof(INTERNAL_SIZE_T)
194 Configuration and functionality options:
196 USE_DL_PREFIX NOT defined
197 USE_PUBLIC_MALLOC_WRAPPERS NOT defined
198 USE_MALLOC_LOCK NOT defined
199 MALLOC_DEBUG NOT defined
200 REALLOC_ZERO_BYTES_FREES 1
201 MALLOC_FAILURE_ACTION errno = ENOMEM, if __STD_C defined, else no-op
202 TRIM_FASTBINS 0
204 Options for customizing MORECORE:
206 MORECORE sbrk
207 MORECORE_FAILURE -1
208 MORECORE_CONTIGUOUS 1
209 MORECORE_CANNOT_TRIM NOT defined
210 MORECORE_CLEARS 1
211 MMAP_AS_MORECORE_SIZE (1024 * 1024)
213 Tuning options that are also dynamically changeable via mallopt:
215 DEFAULT_MXFAST 64
216 DEFAULT_TRIM_THRESHOLD 128 * 1024
217 DEFAULT_TOP_PAD 0
218 DEFAULT_MMAP_THRESHOLD 128 * 1024
219 DEFAULT_MMAP_MAX 65536
221 There are several other #defined constants and macros that you
222 probably don't want to touch unless you are extending or adapting malloc. */
225 __STD_C should be nonzero if using ANSI-standard C compiler, a C++
226 compiler, or a C compiler sufficiently close to ANSI to get away
227 with it.
230 #ifndef __STD_C
231 #if defined(__STDC__) || defined(__cplusplus)
232 #define __STD_C 1
233 #else
234 #define __STD_C 0
235 #endif
236 #endif /*__STD_C*/
240 Void_t* is the pointer type that malloc should say it returns
243 #ifndef Void_t
244 #if (__STD_C || defined(WIN32))
245 #define Void_t void
246 #else
247 #define Void_t char
248 #endif
249 #endif /*Void_t*/
251 #if __STD_C
252 #include <stddef.h> /* for size_t */
253 #include <stdlib.h> /* for getenv(), abort() */
254 #else
255 #include <sys/types.h>
256 #endif
258 #include <malloc-machine.h>
260 #ifdef _LIBC
261 #include <stdio-common/_itoa.h>
262 #endif
264 #ifdef __cplusplus
265 extern "C" {
266 #endif
268 /* define LACKS_UNISTD_H if your system does not have a <unistd.h>. */
270 /* #define LACKS_UNISTD_H */
272 #ifndef LACKS_UNISTD_H
273 #include <unistd.h>
274 #endif
276 /* define LACKS_SYS_PARAM_H if your system does not have a <sys/param.h>. */
278 /* #define LACKS_SYS_PARAM_H */
281 #include <stdio.h> /* needed for malloc_stats */
282 #include <errno.h> /* needed for optional MALLOC_FAILURE_ACTION */
284 /* For uintptr_t. */
285 #include <stdint.h>
287 /* For va_arg, va_start, va_end. */
288 #include <stdarg.h>
290 /* For writev and struct iovec. */
291 #include <sys/uio.h>
292 /* For syslog. */
293 #include <sys/syslog.h>
295 /* For various dynamic linking things. */
296 #include <dlfcn.h>
300 Debugging:
302 Because freed chunks may be overwritten with bookkeeping fields, this
303 malloc will often die when freed memory is overwritten by user
304 programs. This can be very effective (albeit in an annoying way)
305 in helping track down dangling pointers.
307 If you compile with -DMALLOC_DEBUG, a number of assertion checks are
308 enabled that will catch more memory errors. You probably won't be
309 able to make much sense of the actual assertion errors, but they
310 should help you locate incorrectly overwritten memory. The checking
311 is fairly extensive, and will slow down execution
312 noticeably. Calling malloc_stats or mallinfo with MALLOC_DEBUG set
313 will attempt to check every non-mmapped allocated and free chunk in
314 the course of computing the summmaries. (By nature, mmapped regions
315 cannot be checked very much automatically.)
317 Setting MALLOC_DEBUG may also be helpful if you are trying to modify
318 this code. The assertions in the check routines spell out in more
319 detail the assumptions and invariants underlying the algorithms.
321 Setting MALLOC_DEBUG does NOT provide an automated mechanism for
322 checking that all accesses to malloced memory stay within their
323 bounds. However, there are several add-ons and adaptations of this
324 or other mallocs available that do this.
327 #if MALLOC_DEBUG
328 #include <assert.h>
329 #else
330 #undef assert
331 #define assert(x) ((void)0)
332 #endif
336 INTERNAL_SIZE_T is the word-size used for internal bookkeeping
337 of chunk sizes.
339 The default version is the same as size_t.
341 While not strictly necessary, it is best to define this as an
342 unsigned type, even if size_t is a signed type. This may avoid some
343 artificial size limitations on some systems.
345 On a 64-bit machine, you may be able to reduce malloc overhead by
346 defining INTERNAL_SIZE_T to be a 32 bit `unsigned int' at the
347 expense of not being able to handle more than 2^32 of malloced
348 space. If this limitation is acceptable, you are encouraged to set
349 this unless you are on a platform requiring 16byte alignments. In
350 this case the alignment requirements turn out to negate any
351 potential advantages of decreasing size_t word size.
353 Implementors: Beware of the possible combinations of:
354 - INTERNAL_SIZE_T might be signed or unsigned, might be 32 or 64 bits,
355 and might be the same width as int or as long
356 - size_t might have different width and signedness as INTERNAL_SIZE_T
357 - int and long might be 32 or 64 bits, and might be the same width
358 To deal with this, most comparisons and difference computations
359 among INTERNAL_SIZE_Ts should cast them to unsigned long, being
360 aware of the fact that casting an unsigned int to a wider long does
361 not sign-extend. (This also makes checking for negative numbers
362 awkward.) Some of these casts result in harmless compiler warnings
363 on some systems.
366 #ifndef INTERNAL_SIZE_T
367 #define INTERNAL_SIZE_T size_t
368 #endif
370 /* The corresponding word size */
371 #define SIZE_SZ (sizeof(INTERNAL_SIZE_T))
375 MALLOC_ALIGNMENT is the minimum alignment for malloc'ed chunks.
376 It must be a power of two at least 2 * SIZE_SZ, even on machines
377 for which smaller alignments would suffice. It may be defined as
378 larger than this though. Note however that code and data structures
379 are optimized for the case of 8-byte alignment.
383 #ifndef MALLOC_ALIGNMENT
384 #define MALLOC_ALIGNMENT (2 * SIZE_SZ)
385 #endif
387 /* The corresponding bit mask value */
388 #define MALLOC_ALIGN_MASK (MALLOC_ALIGNMENT - 1)
393 REALLOC_ZERO_BYTES_FREES should be set if a call to
394 realloc with zero bytes should be the same as a call to free.
395 This is required by the C standard. Otherwise, since this malloc
396 returns a unique pointer for malloc(0), so does realloc(p, 0).
399 #ifndef REALLOC_ZERO_BYTES_FREES
400 #define REALLOC_ZERO_BYTES_FREES 1
401 #endif
404 TRIM_FASTBINS controls whether free() of a very small chunk can
405 immediately lead to trimming. Setting to true (1) can reduce memory
406 footprint, but will almost always slow down programs that use a lot
407 of small chunks.
409 Define this only if you are willing to give up some speed to more
410 aggressively reduce system-level memory footprint when releasing
411 memory in programs that use many small chunks. You can get
412 essentially the same effect by setting MXFAST to 0, but this can
413 lead to even greater slowdowns in programs using many small chunks.
414 TRIM_FASTBINS is an in-between compile-time option, that disables
415 only those chunks bordering topmost memory from being placed in
416 fastbins.
419 #ifndef TRIM_FASTBINS
420 #define TRIM_FASTBINS 0
421 #endif
425 USE_DL_PREFIX will prefix all public routines with the string 'dl'.
426 This is necessary when you only want to use this malloc in one part
427 of a program, using your regular system malloc elsewhere.
430 /* #define USE_DL_PREFIX */
434 Two-phase name translation.
435 All of the actual routines are given mangled names.
436 When wrappers are used, they become the public callable versions.
437 When DL_PREFIX is used, the callable names are prefixed.
440 #ifdef USE_DL_PREFIX
441 #define public_cALLOc dlcalloc
442 #define public_fREe dlfree
443 #define public_cFREe dlcfree
444 #define public_mALLOc dlmalloc
445 #define public_mEMALIGn dlmemalign
446 #define public_rEALLOc dlrealloc
447 #define public_vALLOc dlvalloc
448 #define public_pVALLOc dlpvalloc
449 #define public_mALLINFo dlmallinfo
450 #define public_mALLOPt dlmallopt
451 #define public_mTRIm dlmalloc_trim
452 #define public_mSTATs dlmalloc_stats
453 #define public_mUSABLe dlmalloc_usable_size
454 #define public_iCALLOc dlindependent_calloc
455 #define public_iCOMALLOc dlindependent_comalloc
456 #define public_gET_STATe dlget_state
457 #define public_sET_STATe dlset_state
458 #else /* USE_DL_PREFIX */
459 #ifdef _LIBC
461 /* Special defines for the GNU C library. */
462 #define public_cALLOc __libc_calloc
463 #define public_fREe __libc_free
464 #define public_cFREe __libc_cfree
465 #define public_mALLOc __libc_malloc
466 #define public_mEMALIGn __libc_memalign
467 #define public_rEALLOc __libc_realloc
468 #define public_vALLOc __libc_valloc
469 #define public_pVALLOc __libc_pvalloc
470 #define public_mALLINFo __libc_mallinfo
471 #define public_mALLOPt __libc_mallopt
472 #define public_mTRIm __malloc_trim
473 #define public_mSTATs __malloc_stats
474 #define public_mUSABLe __malloc_usable_size
475 #define public_iCALLOc __libc_independent_calloc
476 #define public_iCOMALLOc __libc_independent_comalloc
477 #define public_gET_STATe __malloc_get_state
478 #define public_sET_STATe __malloc_set_state
479 #define malloc_getpagesize __getpagesize()
480 #define open __open
481 #define mmap __mmap
482 #define munmap __munmap
483 #define mremap __mremap
484 #define mprotect __mprotect
485 #define MORECORE (*__morecore)
486 #define MORECORE_FAILURE 0
488 Void_t * __default_morecore (ptrdiff_t);
489 Void_t *(*__morecore)(ptrdiff_t) = __default_morecore;
491 #else /* !_LIBC */
492 #define public_cALLOc calloc
493 #define public_fREe free
494 #define public_cFREe cfree
495 #define public_mALLOc malloc
496 #define public_mEMALIGn memalign
497 #define public_rEALLOc realloc
498 #define public_vALLOc valloc
499 #define public_pVALLOc pvalloc
500 #define public_mALLINFo mallinfo
501 #define public_mALLOPt mallopt
502 #define public_mTRIm malloc_trim
503 #define public_mSTATs malloc_stats
504 #define public_mUSABLe malloc_usable_size
505 #define public_iCALLOc independent_calloc
506 #define public_iCOMALLOc independent_comalloc
507 #define public_gET_STATe malloc_get_state
508 #define public_sET_STATe malloc_set_state
509 #endif /* _LIBC */
510 #endif /* USE_DL_PREFIX */
512 #ifndef _LIBC
513 #define __builtin_expect(expr, val) (expr)
515 #define fwrite(buf, size, count, fp) _IO_fwrite (buf, size, count, fp)
516 #endif
519 HAVE_MEMCPY should be defined if you are not otherwise using
520 ANSI STD C, but still have memcpy and memset in your C library
521 and want to use them in calloc and realloc. Otherwise simple
522 macro versions are defined below.
524 USE_MEMCPY should be defined as 1 if you actually want to
525 have memset and memcpy called. People report that the macro
526 versions are faster than libc versions on some systems.
528 Even if USE_MEMCPY is set to 1, loops to copy/clear small chunks
529 (of <= 36 bytes) are manually unrolled in realloc and calloc.
532 #define HAVE_MEMCPY
534 #ifndef USE_MEMCPY
535 #ifdef HAVE_MEMCPY
536 #define USE_MEMCPY 1
537 #else
538 #define USE_MEMCPY 0
539 #endif
540 #endif
543 #if (__STD_C || defined(HAVE_MEMCPY))
545 #ifdef _LIBC
546 # include <string.h>
547 #else
548 #ifdef WIN32
549 /* On Win32 memset and memcpy are already declared in windows.h */
550 #else
551 #if __STD_C
552 void* memset(void*, int, size_t);
553 void* memcpy(void*, const void*, size_t);
554 #else
555 Void_t* memset();
556 Void_t* memcpy();
557 #endif
558 #endif
559 #endif
560 #endif
563 MALLOC_FAILURE_ACTION is the action to take before "return 0" when
564 malloc fails to be able to return memory, either because memory is
565 exhausted or because of illegal arguments.
567 By default, sets errno if running on STD_C platform, else does nothing.
570 #ifndef MALLOC_FAILURE_ACTION
571 #if __STD_C
572 #define MALLOC_FAILURE_ACTION \
573 errno = ENOMEM;
575 #else
576 #define MALLOC_FAILURE_ACTION
577 #endif
578 #endif
581 MORECORE-related declarations. By default, rely on sbrk
585 #ifdef LACKS_UNISTD_H
586 #if !defined(__FreeBSD__) && !defined(__OpenBSD__) && !defined(__NetBSD__)
587 #if __STD_C
588 extern Void_t* sbrk(ptrdiff_t);
589 #else
590 extern Void_t* sbrk();
591 #endif
592 #endif
593 #endif
596 MORECORE is the name of the routine to call to obtain more memory
597 from the system. See below for general guidance on writing
598 alternative MORECORE functions, as well as a version for WIN32 and a
599 sample version for pre-OSX macos.
602 #ifndef MORECORE
603 #define MORECORE sbrk
604 #endif
607 MORECORE_FAILURE is the value returned upon failure of MORECORE
608 as well as mmap. Since it cannot be an otherwise valid memory address,
609 and must reflect values of standard sys calls, you probably ought not
610 try to redefine it.
613 #ifndef MORECORE_FAILURE
614 #define MORECORE_FAILURE (-1)
615 #endif
618 If MORECORE_CONTIGUOUS is true, take advantage of fact that
619 consecutive calls to MORECORE with positive arguments always return
620 contiguous increasing addresses. This is true of unix sbrk. Even
621 if not defined, when regions happen to be contiguous, malloc will
622 permit allocations spanning regions obtained from different
623 calls. But defining this when applicable enables some stronger
624 consistency checks and space efficiencies.
627 #ifndef MORECORE_CONTIGUOUS
628 #define MORECORE_CONTIGUOUS 1
629 #endif
632 Define MORECORE_CANNOT_TRIM if your version of MORECORE
633 cannot release space back to the system when given negative
634 arguments. This is generally necessary only if you are using
635 a hand-crafted MORECORE function that cannot handle negative arguments.
638 /* #define MORECORE_CANNOT_TRIM */
640 /* MORECORE_CLEARS (default 1)
641 The degree to which the routine mapped to MORECORE zeroes out
642 memory: never (0), only for newly allocated space (1) or always
643 (2). The distinction between (1) and (2) is necessary because on
644 some systems, if the application first decrements and then
645 increments the break value, the contents of the reallocated space
646 are unspecified.
649 #ifndef MORECORE_CLEARS
650 #define MORECORE_CLEARS 1
651 #endif
655 Define HAVE_MMAP as true to optionally make malloc() use mmap() to
656 allocate very large blocks. These will be returned to the
657 operating system immediately after a free(). Also, if mmap
658 is available, it is used as a backup strategy in cases where
659 MORECORE fails to provide space from system.
661 This malloc is best tuned to work with mmap for large requests.
662 If you do not have mmap, operations involving very large chunks (1MB
663 or so) may be slower than you'd like.
666 #ifndef HAVE_MMAP
667 #define HAVE_MMAP 1
670 Standard unix mmap using /dev/zero clears memory so calloc doesn't
671 need to.
674 #ifndef MMAP_CLEARS
675 #define MMAP_CLEARS 1
676 #endif
678 #else /* no mmap */
679 #ifndef MMAP_CLEARS
680 #define MMAP_CLEARS 0
681 #endif
682 #endif
686 MMAP_AS_MORECORE_SIZE is the minimum mmap size argument to use if
687 sbrk fails, and mmap is used as a backup (which is done only if
688 HAVE_MMAP). The value must be a multiple of page size. This
689 backup strategy generally applies only when systems have "holes" in
690 address space, so sbrk cannot perform contiguous expansion, but
691 there is still space available on system. On systems for which
692 this is known to be useful (i.e. most linux kernels), this occurs
693 only when programs allocate huge amounts of memory. Between this,
694 and the fact that mmap regions tend to be limited, the size should
695 be large, to avoid too many mmap calls and thus avoid running out
696 of kernel resources.
699 #ifndef MMAP_AS_MORECORE_SIZE
700 #define MMAP_AS_MORECORE_SIZE (1024 * 1024)
701 #endif
704 Define HAVE_MREMAP to make realloc() use mremap() to re-allocate
705 large blocks. This is currently only possible on Linux with
706 kernel versions newer than 1.3.77.
709 #ifndef HAVE_MREMAP
710 #ifdef linux
711 #define HAVE_MREMAP 1
712 #else
713 #define HAVE_MREMAP 0
714 #endif
716 #endif /* HAVE_MMAP */
718 /* Define USE_ARENAS to enable support for multiple `arenas'. These
719 are allocated using mmap(), are necessary for threads and
720 occasionally useful to overcome address space limitations affecting
721 sbrk(). */
723 #ifndef USE_ARENAS
724 #define USE_ARENAS HAVE_MMAP
725 #endif
729 The system page size. To the extent possible, this malloc manages
730 memory from the system in page-size units. Note that this value is
731 cached during initialization into a field of malloc_state. So even
732 if malloc_getpagesize is a function, it is only called once.
734 The following mechanics for getpagesize were adapted from bsd/gnu
735 getpagesize.h. If none of the system-probes here apply, a value of
736 4096 is used, which should be OK: If they don't apply, then using
737 the actual value probably doesn't impact performance.
741 #ifndef malloc_getpagesize
743 #ifndef LACKS_UNISTD_H
744 # include <unistd.h>
745 #endif
747 # ifdef _SC_PAGESIZE /* some SVR4 systems omit an underscore */
748 # ifndef _SC_PAGE_SIZE
749 # define _SC_PAGE_SIZE _SC_PAGESIZE
750 # endif
751 # endif
753 # ifdef _SC_PAGE_SIZE
754 # define malloc_getpagesize sysconf(_SC_PAGE_SIZE)
755 # else
756 # if defined(BSD) || defined(DGUX) || defined(HAVE_GETPAGESIZE)
757 extern size_t getpagesize();
758 # define malloc_getpagesize getpagesize()
759 # else
760 # ifdef WIN32 /* use supplied emulation of getpagesize */
761 # define malloc_getpagesize getpagesize()
762 # else
763 # ifndef LACKS_SYS_PARAM_H
764 # include <sys/param.h>
765 # endif
766 # ifdef EXEC_PAGESIZE
767 # define malloc_getpagesize EXEC_PAGESIZE
768 # else
769 # ifdef NBPG
770 # ifndef CLSIZE
771 # define malloc_getpagesize NBPG
772 # else
773 # define malloc_getpagesize (NBPG * CLSIZE)
774 # endif
775 # else
776 # ifdef NBPC
777 # define malloc_getpagesize NBPC
778 # else
779 # ifdef PAGESIZE
780 # define malloc_getpagesize PAGESIZE
781 # else /* just guess */
782 # define malloc_getpagesize (4096)
783 # endif
784 # endif
785 # endif
786 # endif
787 # endif
788 # endif
789 # endif
790 #endif
793 This version of malloc supports the standard SVID/XPG mallinfo
794 routine that returns a struct containing usage properties and
795 statistics. It should work on any SVID/XPG compliant system that has
796 a /usr/include/malloc.h defining struct mallinfo. (If you'd like to
797 install such a thing yourself, cut out the preliminary declarations
798 as described above and below and save them in a malloc.h file. But
799 there's no compelling reason to bother to do this.)
801 The main declaration needed is the mallinfo struct that is returned
802 (by-copy) by mallinfo(). The SVID/XPG malloinfo struct contains a
803 bunch of fields that are not even meaningful in this version of
804 malloc. These fields are are instead filled by mallinfo() with
805 other numbers that might be of interest.
807 HAVE_USR_INCLUDE_MALLOC_H should be set if you have a
808 /usr/include/malloc.h file that includes a declaration of struct
809 mallinfo. If so, it is included; else an SVID2/XPG2 compliant
810 version is declared below. These must be precisely the same for
811 mallinfo() to work. The original SVID version of this struct,
812 defined on most systems with mallinfo, declares all fields as
813 ints. But some others define as unsigned long. If your system
814 defines the fields using a type of different width than listed here,
815 you must #include your system version and #define
816 HAVE_USR_INCLUDE_MALLOC_H.
819 /* #define HAVE_USR_INCLUDE_MALLOC_H */
821 #ifdef HAVE_USR_INCLUDE_MALLOC_H
822 #include "/usr/include/malloc.h"
823 #endif
826 /* ---------- description of public routines ------------ */
829 malloc(size_t n)
830 Returns a pointer to a newly allocated chunk of at least n bytes, or null
831 if no space is available. Additionally, on failure, errno is
832 set to ENOMEM on ANSI C systems.
834 If n is zero, malloc returns a minumum-sized chunk. (The minimum
835 size is 16 bytes on most 32bit systems, and 24 or 32 bytes on 64bit
836 systems.) On most systems, size_t is an unsigned type, so calls
837 with negative arguments are interpreted as requests for huge amounts
838 of space, which will often fail. The maximum supported value of n
839 differs across systems, but is in all cases less than the maximum
840 representable value of a size_t.
842 #if __STD_C
843 Void_t* public_mALLOc(size_t);
844 #else
845 Void_t* public_mALLOc();
846 #endif
847 #ifdef libc_hidden_proto
848 libc_hidden_proto (public_mALLOc)
849 #endif
852 free(Void_t* p)
853 Releases the chunk of memory pointed to by p, that had been previously
854 allocated using malloc or a related routine such as realloc.
855 It has no effect if p is null. It can have arbitrary (i.e., bad!)
856 effects if p has already been freed.
858 Unless disabled (using mallopt), freeing very large spaces will
859 when possible, automatically trigger operations that give
860 back unused memory to the system, thus reducing program footprint.
862 #if __STD_C
863 void public_fREe(Void_t*);
864 #else
865 void public_fREe();
866 #endif
867 #ifdef libc_hidden_proto
868 libc_hidden_proto (public_fREe)
869 #endif
872 calloc(size_t n_elements, size_t element_size);
873 Returns a pointer to n_elements * element_size bytes, with all locations
874 set to zero.
876 #if __STD_C
877 Void_t* public_cALLOc(size_t, size_t);
878 #else
879 Void_t* public_cALLOc();
880 #endif
883 realloc(Void_t* p, size_t n)
884 Returns a pointer to a chunk of size n that contains the same data
885 as does chunk p up to the minimum of (n, p's size) bytes, or null
886 if no space is available.
888 The returned pointer may or may not be the same as p. The algorithm
889 prefers extending p when possible, otherwise it employs the
890 equivalent of a malloc-copy-free sequence.
892 If p is null, realloc is equivalent to malloc.
894 If space is not available, realloc returns null, errno is set (if on
895 ANSI) and p is NOT freed.
897 if n is for fewer bytes than already held by p, the newly unused
898 space is lopped off and freed if possible. Unless the #define
899 REALLOC_ZERO_BYTES_FREES is set, realloc with a size argument of
900 zero (re)allocates a minimum-sized chunk.
902 Large chunks that were internally obtained via mmap will always
903 be reallocated using malloc-copy-free sequences unless
904 the system supports MREMAP (currently only linux).
906 The old unix realloc convention of allowing the last-free'd chunk
907 to be used as an argument to realloc is not supported.
909 #if __STD_C
910 Void_t* public_rEALLOc(Void_t*, size_t);
911 #else
912 Void_t* public_rEALLOc();
913 #endif
914 #ifdef libc_hidden_proto
915 libc_hidden_proto (public_rEALLOc)
916 #endif
919 memalign(size_t alignment, size_t n);
920 Returns a pointer to a newly allocated chunk of n bytes, aligned
921 in accord with the alignment argument.
923 The alignment argument should be a power of two. If the argument is
924 not a power of two, the nearest greater power is used.
925 8-byte alignment is guaranteed by normal malloc calls, so don't
926 bother calling memalign with an argument of 8 or less.
928 Overreliance on memalign is a sure way to fragment space.
930 #if __STD_C
931 Void_t* public_mEMALIGn(size_t, size_t);
932 #else
933 Void_t* public_mEMALIGn();
934 #endif
935 #ifdef libc_hidden_proto
936 libc_hidden_proto (public_mEMALIGn)
937 #endif
940 valloc(size_t n);
941 Equivalent to memalign(pagesize, n), where pagesize is the page
942 size of the system. If the pagesize is unknown, 4096 is used.
944 #if __STD_C
945 Void_t* public_vALLOc(size_t);
946 #else
947 Void_t* public_vALLOc();
948 #endif
953 mallopt(int parameter_number, int parameter_value)
954 Sets tunable parameters The format is to provide a
955 (parameter-number, parameter-value) pair. mallopt then sets the
956 corresponding parameter to the argument value if it can (i.e., so
957 long as the value is meaningful), and returns 1 if successful else
958 0. SVID/XPG/ANSI defines four standard param numbers for mallopt,
959 normally defined in malloc.h. Only one of these (M_MXFAST) is used
960 in this malloc. The others (M_NLBLKS, M_GRAIN, M_KEEP) don't apply,
961 so setting them has no effect. But this malloc also supports four
962 other options in mallopt. See below for details. Briefly, supported
963 parameters are as follows (listed defaults are for "typical"
964 configurations).
966 Symbol param # default allowed param values
967 M_MXFAST 1 64 0-80 (0 disables fastbins)
968 M_TRIM_THRESHOLD -1 128*1024 any (-1U disables trimming)
969 M_TOP_PAD -2 0 any
970 M_MMAP_THRESHOLD -3 128*1024 any (or 0 if no MMAP support)
971 M_MMAP_MAX -4 65536 any (0 disables use of mmap)
973 #if __STD_C
974 int public_mALLOPt(int, int);
975 #else
976 int public_mALLOPt();
977 #endif
981 mallinfo()
982 Returns (by copy) a struct containing various summary statistics:
984 arena: current total non-mmapped bytes allocated from system
985 ordblks: the number of free chunks
986 smblks: the number of fastbin blocks (i.e., small chunks that
987 have been freed but not use resused or consolidated)
988 hblks: current number of mmapped regions
989 hblkhd: total bytes held in mmapped regions
990 usmblks: the maximum total allocated space. This will be greater
991 than current total if trimming has occurred.
992 fsmblks: total bytes held in fastbin blocks
993 uordblks: current total allocated space (normal or mmapped)
994 fordblks: total free space
995 keepcost: the maximum number of bytes that could ideally be released
996 back to system via malloc_trim. ("ideally" means that
997 it ignores page restrictions etc.)
999 Because these fields are ints, but internal bookkeeping may
1000 be kept as longs, the reported values may wrap around zero and
1001 thus be inaccurate.
1003 #if __STD_C
1004 struct mallinfo public_mALLINFo(void);
1005 #else
1006 struct mallinfo public_mALLINFo();
1007 #endif
1010 independent_calloc(size_t n_elements, size_t element_size, Void_t* chunks[]);
1012 independent_calloc is similar to calloc, but instead of returning a
1013 single cleared space, it returns an array of pointers to n_elements
1014 independent elements that can hold contents of size elem_size, each
1015 of which starts out cleared, and can be independently freed,
1016 realloc'ed etc. The elements are guaranteed to be adjacently
1017 allocated (this is not guaranteed to occur with multiple callocs or
1018 mallocs), which may also improve cache locality in some
1019 applications.
1021 The "chunks" argument is optional (i.e., may be null, which is
1022 probably the most typical usage). If it is null, the returned array
1023 is itself dynamically allocated and should also be freed when it is
1024 no longer needed. Otherwise, the chunks array must be of at least
1025 n_elements in length. It is filled in with the pointers to the
1026 chunks.
1028 In either case, independent_calloc returns this pointer array, or
1029 null if the allocation failed. If n_elements is zero and "chunks"
1030 is null, it returns a chunk representing an array with zero elements
1031 (which should be freed if not wanted).
1033 Each element must be individually freed when it is no longer
1034 needed. If you'd like to instead be able to free all at once, you
1035 should instead use regular calloc and assign pointers into this
1036 space to represent elements. (In this case though, you cannot
1037 independently free elements.)
1039 independent_calloc simplifies and speeds up implementations of many
1040 kinds of pools. It may also be useful when constructing large data
1041 structures that initially have a fixed number of fixed-sized nodes,
1042 but the number is not known at compile time, and some of the nodes
1043 may later need to be freed. For example:
1045 struct Node { int item; struct Node* next; };
1047 struct Node* build_list() {
1048 struct Node** pool;
1049 int n = read_number_of_nodes_needed();
1050 if (n <= 0) return 0;
1051 pool = (struct Node**)(independent_calloc(n, sizeof(struct Node), 0);
1052 if (pool == 0) die();
1053 // organize into a linked list...
1054 struct Node* first = pool[0];
1055 for (i = 0; i < n-1; ++i)
1056 pool[i]->next = pool[i+1];
1057 free(pool); // Can now free the array (or not, if it is needed later)
1058 return first;
1061 #if __STD_C
1062 Void_t** public_iCALLOc(size_t, size_t, Void_t**);
1063 #else
1064 Void_t** public_iCALLOc();
1065 #endif
1068 independent_comalloc(size_t n_elements, size_t sizes[], Void_t* chunks[]);
1070 independent_comalloc allocates, all at once, a set of n_elements
1071 chunks with sizes indicated in the "sizes" array. It returns
1072 an array of pointers to these elements, each of which can be
1073 independently freed, realloc'ed etc. The elements are guaranteed to
1074 be adjacently allocated (this is not guaranteed to occur with
1075 multiple callocs or mallocs), which may also improve cache locality
1076 in some applications.
1078 The "chunks" argument is optional (i.e., may be null). If it is null
1079 the returned array is itself dynamically allocated and should also
1080 be freed when it is no longer needed. Otherwise, the chunks array
1081 must be of at least n_elements in length. It is filled in with the
1082 pointers to the chunks.
1084 In either case, independent_comalloc returns this pointer array, or
1085 null if the allocation failed. If n_elements is zero and chunks is
1086 null, it returns a chunk representing an array with zero elements
1087 (which should be freed if not wanted).
1089 Each element must be individually freed when it is no longer
1090 needed. If you'd like to instead be able to free all at once, you
1091 should instead use a single regular malloc, and assign pointers at
1092 particular offsets in the aggregate space. (In this case though, you
1093 cannot independently free elements.)
1095 independent_comallac differs from independent_calloc in that each
1096 element may have a different size, and also that it does not
1097 automatically clear elements.
1099 independent_comalloc can be used to speed up allocation in cases
1100 where several structs or objects must always be allocated at the
1101 same time. For example:
1103 struct Head { ... }
1104 struct Foot { ... }
1106 void send_message(char* msg) {
1107 int msglen = strlen(msg);
1108 size_t sizes[3] = { sizeof(struct Head), msglen, sizeof(struct Foot) };
1109 void* chunks[3];
1110 if (independent_comalloc(3, sizes, chunks) == 0)
1111 die();
1112 struct Head* head = (struct Head*)(chunks[0]);
1113 char* body = (char*)(chunks[1]);
1114 struct Foot* foot = (struct Foot*)(chunks[2]);
1115 // ...
1118 In general though, independent_comalloc is worth using only for
1119 larger values of n_elements. For small values, you probably won't
1120 detect enough difference from series of malloc calls to bother.
1122 Overuse of independent_comalloc can increase overall memory usage,
1123 since it cannot reuse existing noncontiguous small chunks that
1124 might be available for some of the elements.
1126 #if __STD_C
1127 Void_t** public_iCOMALLOc(size_t, size_t*, Void_t**);
1128 #else
1129 Void_t** public_iCOMALLOc();
1130 #endif
1134 pvalloc(size_t n);
1135 Equivalent to valloc(minimum-page-that-holds(n)), that is,
1136 round up n to nearest pagesize.
1138 #if __STD_C
1139 Void_t* public_pVALLOc(size_t);
1140 #else
1141 Void_t* public_pVALLOc();
1142 #endif
1145 cfree(Void_t* p);
1146 Equivalent to free(p).
1148 cfree is needed/defined on some systems that pair it with calloc,
1149 for odd historical reasons (such as: cfree is used in example
1150 code in the first edition of K&R).
1152 #if __STD_C
1153 void public_cFREe(Void_t*);
1154 #else
1155 void public_cFREe();
1156 #endif
1159 malloc_trim(size_t pad);
1161 If possible, gives memory back to the system (via negative
1162 arguments to sbrk) if there is unused memory at the `high' end of
1163 the malloc pool. You can call this after freeing large blocks of
1164 memory to potentially reduce the system-level memory requirements
1165 of a program. However, it cannot guarantee to reduce memory. Under
1166 some allocation patterns, some large free blocks of memory will be
1167 locked between two used chunks, so they cannot be given back to
1168 the system.
1170 The `pad' argument to malloc_trim represents the amount of free
1171 trailing space to leave untrimmed. If this argument is zero,
1172 only the minimum amount of memory to maintain internal data
1173 structures will be left (one page or less). Non-zero arguments
1174 can be supplied to maintain enough trailing space to service
1175 future expected allocations without having to re-obtain memory
1176 from the system.
1178 Malloc_trim returns 1 if it actually released any memory, else 0.
1179 On systems that do not support "negative sbrks", it will always
1180 rreturn 0.
1182 #if __STD_C
1183 int public_mTRIm(size_t);
1184 #else
1185 int public_mTRIm();
1186 #endif
1189 malloc_usable_size(Void_t* p);
1191 Returns the number of bytes you can actually use in
1192 an allocated chunk, which may be more than you requested (although
1193 often not) due to alignment and minimum size constraints.
1194 You can use this many bytes without worrying about
1195 overwriting other allocated objects. This is not a particularly great
1196 programming practice. malloc_usable_size can be more useful in
1197 debugging and assertions, for example:
1199 p = malloc(n);
1200 assert(malloc_usable_size(p) >= 256);
1203 #if __STD_C
1204 size_t public_mUSABLe(Void_t*);
1205 #else
1206 size_t public_mUSABLe();
1207 #endif
1210 malloc_stats();
1211 Prints on stderr the amount of space obtained from the system (both
1212 via sbrk and mmap), the maximum amount (which may be more than
1213 current if malloc_trim and/or munmap got called), and the current
1214 number of bytes allocated via malloc (or realloc, etc) but not yet
1215 freed. Note that this is the number of bytes allocated, not the
1216 number requested. It will be larger than the number requested
1217 because of alignment and bookkeeping overhead. Because it includes
1218 alignment wastage as being in use, this figure may be greater than
1219 zero even when no user-level chunks are allocated.
1221 The reported current and maximum system memory can be inaccurate if
1222 a program makes other calls to system memory allocation functions
1223 (normally sbrk) outside of malloc.
1225 malloc_stats prints only the most commonly interesting statistics.
1226 More information can be obtained by calling mallinfo.
1229 #if __STD_C
1230 void public_mSTATs(void);
1231 #else
1232 void public_mSTATs();
1233 #endif
1236 malloc_get_state(void);
1238 Returns the state of all malloc variables in an opaque data
1239 structure.
1241 #if __STD_C
1242 Void_t* public_gET_STATe(void);
1243 #else
1244 Void_t* public_gET_STATe();
1245 #endif
1248 malloc_set_state(Void_t* state);
1250 Restore the state of all malloc variables from data obtained with
1251 malloc_get_state().
1253 #if __STD_C
1254 int public_sET_STATe(Void_t*);
1255 #else
1256 int public_sET_STATe();
1257 #endif
1259 #ifdef _LIBC
1261 posix_memalign(void **memptr, size_t alignment, size_t size);
1263 POSIX wrapper like memalign(), checking for validity of size.
1265 int __posix_memalign(void **, size_t, size_t);
1266 #endif
1268 /* mallopt tuning options */
1271 M_MXFAST is the maximum request size used for "fastbins", special bins
1272 that hold returned chunks without consolidating their spaces. This
1273 enables future requests for chunks of the same size to be handled
1274 very quickly, but can increase fragmentation, and thus increase the
1275 overall memory footprint of a program.
1277 This malloc manages fastbins very conservatively yet still
1278 efficiently, so fragmentation is rarely a problem for values less
1279 than or equal to the default. The maximum supported value of MXFAST
1280 is 80. You wouldn't want it any higher than this anyway. Fastbins
1281 are designed especially for use with many small structs, objects or
1282 strings -- the default handles structs/objects/arrays with sizes up
1283 to 8 4byte fields, or small strings representing words, tokens,
1284 etc. Using fastbins for larger objects normally worsens
1285 fragmentation without improving speed.
1287 M_MXFAST is set in REQUEST size units. It is internally used in
1288 chunksize units, which adds padding and alignment. You can reduce
1289 M_MXFAST to 0 to disable all use of fastbins. This causes the malloc
1290 algorithm to be a closer approximation of fifo-best-fit in all cases,
1291 not just for larger requests, but will generally cause it to be
1292 slower.
1296 /* M_MXFAST is a standard SVID/XPG tuning option, usually listed in malloc.h */
1297 #ifndef M_MXFAST
1298 #define M_MXFAST 1
1299 #endif
1301 #ifndef DEFAULT_MXFAST
1302 #define DEFAULT_MXFAST 64
1303 #endif
1307 M_TRIM_THRESHOLD is the maximum amount of unused top-most memory
1308 to keep before releasing via malloc_trim in free().
1310 Automatic trimming is mainly useful in long-lived programs.
1311 Because trimming via sbrk can be slow on some systems, and can
1312 sometimes be wasteful (in cases where programs immediately
1313 afterward allocate more large chunks) the value should be high
1314 enough so that your overall system performance would improve by
1315 releasing this much memory.
1317 The trim threshold and the mmap control parameters (see below)
1318 can be traded off with one another. Trimming and mmapping are
1319 two different ways of releasing unused memory back to the
1320 system. Between these two, it is often possible to keep
1321 system-level demands of a long-lived program down to a bare
1322 minimum. For example, in one test suite of sessions measuring
1323 the XF86 X server on Linux, using a trim threshold of 128K and a
1324 mmap threshold of 192K led to near-minimal long term resource
1325 consumption.
1327 If you are using this malloc in a long-lived program, it should
1328 pay to experiment with these values. As a rough guide, you
1329 might set to a value close to the average size of a process
1330 (program) running on your system. Releasing this much memory
1331 would allow such a process to run in memory. Generally, it's
1332 worth it to tune for trimming rather tham memory mapping when a
1333 program undergoes phases where several large chunks are
1334 allocated and released in ways that can reuse each other's
1335 storage, perhaps mixed with phases where there are no such
1336 chunks at all. And in well-behaved long-lived programs,
1337 controlling release of large blocks via trimming versus mapping
1338 is usually faster.
1340 However, in most programs, these parameters serve mainly as
1341 protection against the system-level effects of carrying around
1342 massive amounts of unneeded memory. Since frequent calls to
1343 sbrk, mmap, and munmap otherwise degrade performance, the default
1344 parameters are set to relatively high values that serve only as
1345 safeguards.
1347 The trim value It must be greater than page size to have any useful
1348 effect. To disable trimming completely, you can set to
1349 (unsigned long)(-1)
1351 Trim settings interact with fastbin (MXFAST) settings: Unless
1352 TRIM_FASTBINS is defined, automatic trimming never takes place upon
1353 freeing a chunk with size less than or equal to MXFAST. Trimming is
1354 instead delayed until subsequent freeing of larger chunks. However,
1355 you can still force an attempted trim by calling malloc_trim.
1357 Also, trimming is not generally possible in cases where
1358 the main arena is obtained via mmap.
1360 Note that the trick some people use of mallocing a huge space and
1361 then freeing it at program startup, in an attempt to reserve system
1362 memory, doesn't have the intended effect under automatic trimming,
1363 since that memory will immediately be returned to the system.
1366 #define M_TRIM_THRESHOLD -1
1368 #ifndef DEFAULT_TRIM_THRESHOLD
1369 #define DEFAULT_TRIM_THRESHOLD (128 * 1024)
1370 #endif
1373 M_TOP_PAD is the amount of extra `padding' space to allocate or
1374 retain whenever sbrk is called. It is used in two ways internally:
1376 * When sbrk is called to extend the top of the arena to satisfy
1377 a new malloc request, this much padding is added to the sbrk
1378 request.
1380 * When malloc_trim is called automatically from free(),
1381 it is used as the `pad' argument.
1383 In both cases, the actual amount of padding is rounded
1384 so that the end of the arena is always a system page boundary.
1386 The main reason for using padding is to avoid calling sbrk so
1387 often. Having even a small pad greatly reduces the likelihood
1388 that nearly every malloc request during program start-up (or
1389 after trimming) will invoke sbrk, which needlessly wastes
1390 time.
1392 Automatic rounding-up to page-size units is normally sufficient
1393 to avoid measurable overhead, so the default is 0. However, in
1394 systems where sbrk is relatively slow, it can pay to increase
1395 this value, at the expense of carrying around more memory than
1396 the program needs.
1399 #define M_TOP_PAD -2
1401 #ifndef DEFAULT_TOP_PAD
1402 #define DEFAULT_TOP_PAD (0)
1403 #endif
1406 M_MMAP_THRESHOLD is the request size threshold for using mmap()
1407 to service a request. Requests of at least this size that cannot
1408 be allocated using already-existing space will be serviced via mmap.
1409 (If enough normal freed space already exists it is used instead.)
1411 Using mmap segregates relatively large chunks of memory so that
1412 they can be individually obtained and released from the host
1413 system. A request serviced through mmap is never reused by any
1414 other request (at least not directly; the system may just so
1415 happen to remap successive requests to the same locations).
1417 Segregating space in this way has the benefits that:
1419 1. Mmapped space can ALWAYS be individually released back
1420 to the system, which helps keep the system level memory
1421 demands of a long-lived program low.
1422 2. Mapped memory can never become `locked' between
1423 other chunks, as can happen with normally allocated chunks, which
1424 means that even trimming via malloc_trim would not release them.
1425 3. On some systems with "holes" in address spaces, mmap can obtain
1426 memory that sbrk cannot.
1428 However, it has the disadvantages that:
1430 1. The space cannot be reclaimed, consolidated, and then
1431 used to service later requests, as happens with normal chunks.
1432 2. It can lead to more wastage because of mmap page alignment
1433 requirements
1434 3. It causes malloc performance to be more dependent on host
1435 system memory management support routines which may vary in
1436 implementation quality and may impose arbitrary
1437 limitations. Generally, servicing a request via normal
1438 malloc steps is faster than going through a system's mmap.
1440 The advantages of mmap nearly always outweigh disadvantages for
1441 "large" chunks, but the value of "large" varies across systems. The
1442 default is an empirically derived value that works well in most
1443 systems.
1446 #define M_MMAP_THRESHOLD -3
1448 #ifndef DEFAULT_MMAP_THRESHOLD
1449 #define DEFAULT_MMAP_THRESHOLD (128 * 1024)
1450 #endif
1453 M_MMAP_MAX is the maximum number of requests to simultaneously
1454 service using mmap. This parameter exists because
1455 some systems have a limited number of internal tables for
1456 use by mmap, and using more than a few of them may degrade
1457 performance.
1459 The default is set to a value that serves only as a safeguard.
1460 Setting to 0 disables use of mmap for servicing large requests. If
1461 HAVE_MMAP is not set, the default value is 0, and attempts to set it
1462 to non-zero values in mallopt will fail.
1465 #define M_MMAP_MAX -4
1467 #ifndef DEFAULT_MMAP_MAX
1468 #if HAVE_MMAP
1469 #define DEFAULT_MMAP_MAX (65536)
1470 #else
1471 #define DEFAULT_MMAP_MAX (0)
1472 #endif
1473 #endif
1475 #ifdef __cplusplus
1476 } /* end of extern "C" */
1477 #endif
1479 #include <malloc.h>
1481 #ifndef BOUNDED_N
1482 #define BOUNDED_N(ptr, sz) (ptr)
1483 #endif
1484 #ifndef RETURN_ADDRESS
1485 #define RETURN_ADDRESS(X_) (NULL)
1486 #endif
1488 /* On some platforms we can compile internal, not exported functions better.
1489 Let the environment provide a macro and define it to be empty if it
1490 is not available. */
1491 #ifndef internal_function
1492 # define internal_function
1493 #endif
1495 /* Forward declarations. */
1496 struct malloc_chunk;
1497 typedef struct malloc_chunk* mchunkptr;
1499 /* Internal routines. */
1501 #if __STD_C
1503 Void_t* _int_malloc(mstate, size_t);
1504 void _int_free(mstate, Void_t*);
1505 Void_t* _int_realloc(mstate, Void_t*, size_t);
1506 Void_t* _int_memalign(mstate, size_t, size_t);
1507 Void_t* _int_valloc(mstate, size_t);
1508 static Void_t* _int_pvalloc(mstate, size_t);
1509 /*static Void_t* cALLOc(size_t, size_t);*/
1510 static Void_t** _int_icalloc(mstate, size_t, size_t, Void_t**);
1511 static Void_t** _int_icomalloc(mstate, size_t, size_t*, Void_t**);
1512 static int mTRIm(size_t);
1513 static size_t mUSABLe(Void_t*);
1514 static void mSTATs(void);
1515 static int mALLOPt(int, int);
1516 static struct mallinfo mALLINFo(mstate);
1517 static void malloc_printerr(int action, const char *str, void *ptr);
1519 static Void_t* internal_function mem2mem_check(Void_t *p, size_t sz);
1520 static int internal_function top_check(void);
1521 static void internal_function munmap_chunk(mchunkptr p);
1522 #if HAVE_MREMAP
1523 static mchunkptr internal_function mremap_chunk(mchunkptr p, size_t new_size);
1524 #endif
1526 static Void_t* malloc_check(size_t sz, const Void_t *caller);
1527 static void free_check(Void_t* mem, const Void_t *caller);
1528 static Void_t* realloc_check(Void_t* oldmem, size_t bytes,
1529 const Void_t *caller);
1530 static Void_t* memalign_check(size_t alignment, size_t bytes,
1531 const Void_t *caller);
1532 #ifndef NO_THREADS
1533 # ifdef _LIBC
1534 # if USE___THREAD || (defined USE_TLS && !defined SHARED)
1535 /* These routines are never needed in this configuration. */
1536 # define NO_STARTER
1537 # endif
1538 # endif
1539 # ifdef NO_STARTER
1540 # undef NO_STARTER
1541 # else
1542 static Void_t* malloc_starter(size_t sz, const Void_t *caller);
1543 static Void_t* memalign_starter(size_t aln, size_t sz, const Void_t *caller);
1544 static void free_starter(Void_t* mem, const Void_t *caller);
1545 # endif
1546 static Void_t* malloc_atfork(size_t sz, const Void_t *caller);
1547 static void free_atfork(Void_t* mem, const Void_t *caller);
1548 #endif
1550 #else
1552 Void_t* _int_malloc();
1553 void _int_free();
1554 Void_t* _int_realloc();
1555 Void_t* _int_memalign();
1556 Void_t* _int_valloc();
1557 Void_t* _int_pvalloc();
1558 /*static Void_t* cALLOc();*/
1559 static Void_t** _int_icalloc();
1560 static Void_t** _int_icomalloc();
1561 static int mTRIm();
1562 static size_t mUSABLe();
1563 static void mSTATs();
1564 static int mALLOPt();
1565 static struct mallinfo mALLINFo();
1567 #endif
1572 /* ------------- Optional versions of memcopy ---------------- */
1575 #if USE_MEMCPY
1578 Note: memcpy is ONLY invoked with non-overlapping regions,
1579 so the (usually slower) memmove is not needed.
1582 #define MALLOC_COPY(dest, src, nbytes) memcpy(dest, src, nbytes)
1583 #define MALLOC_ZERO(dest, nbytes) memset(dest, 0, nbytes)
1585 #else /* !USE_MEMCPY */
1587 /* Use Duff's device for good zeroing/copying performance. */
1589 #define MALLOC_ZERO(charp, nbytes) \
1590 do { \
1591 INTERNAL_SIZE_T* mzp = (INTERNAL_SIZE_T*)(charp); \
1592 unsigned long mctmp = (nbytes)/sizeof(INTERNAL_SIZE_T); \
1593 long mcn; \
1594 if (mctmp < 8) mcn = 0; else { mcn = (mctmp-1)/8; mctmp %= 8; } \
1595 switch (mctmp) { \
1596 case 0: for(;;) { *mzp++ = 0; \
1597 case 7: *mzp++ = 0; \
1598 case 6: *mzp++ = 0; \
1599 case 5: *mzp++ = 0; \
1600 case 4: *mzp++ = 0; \
1601 case 3: *mzp++ = 0; \
1602 case 2: *mzp++ = 0; \
1603 case 1: *mzp++ = 0; if(mcn <= 0) break; mcn--; } \
1605 } while(0)
1607 #define MALLOC_COPY(dest,src,nbytes) \
1608 do { \
1609 INTERNAL_SIZE_T* mcsrc = (INTERNAL_SIZE_T*) src; \
1610 INTERNAL_SIZE_T* mcdst = (INTERNAL_SIZE_T*) dest; \
1611 unsigned long mctmp = (nbytes)/sizeof(INTERNAL_SIZE_T); \
1612 long mcn; \
1613 if (mctmp < 8) mcn = 0; else { mcn = (mctmp-1)/8; mctmp %= 8; } \
1614 switch (mctmp) { \
1615 case 0: for(;;) { *mcdst++ = *mcsrc++; \
1616 case 7: *mcdst++ = *mcsrc++; \
1617 case 6: *mcdst++ = *mcsrc++; \
1618 case 5: *mcdst++ = *mcsrc++; \
1619 case 4: *mcdst++ = *mcsrc++; \
1620 case 3: *mcdst++ = *mcsrc++; \
1621 case 2: *mcdst++ = *mcsrc++; \
1622 case 1: *mcdst++ = *mcsrc++; if(mcn <= 0) break; mcn--; } \
1624 } while(0)
1626 #endif
1628 /* ------------------ MMAP support ------------------ */
1631 #if HAVE_MMAP
1633 #include <fcntl.h>
1634 #ifndef LACKS_SYS_MMAN_H
1635 #include <sys/mman.h>
1636 #endif
1638 #if !defined(MAP_ANONYMOUS) && defined(MAP_ANON)
1639 # define MAP_ANONYMOUS MAP_ANON
1640 #endif
1641 #if !defined(MAP_FAILED)
1642 # define MAP_FAILED ((char*)-1)
1643 #endif
1645 #ifndef MAP_NORESERVE
1646 # ifdef MAP_AUTORESRV
1647 # define MAP_NORESERVE MAP_AUTORESRV
1648 # else
1649 # define MAP_NORESERVE 0
1650 # endif
1651 #endif
1654 Nearly all versions of mmap support MAP_ANONYMOUS,
1655 so the following is unlikely to be needed, but is
1656 supplied just in case.
1659 #ifndef MAP_ANONYMOUS
1661 static int dev_zero_fd = -1; /* Cached file descriptor for /dev/zero. */
1663 #define MMAP(addr, size, prot, flags) ((dev_zero_fd < 0) ? \
1664 (dev_zero_fd = open("/dev/zero", O_RDWR), \
1665 mmap((addr), (size), (prot), (flags), dev_zero_fd, 0)) : \
1666 mmap((addr), (size), (prot), (flags), dev_zero_fd, 0))
1668 #else
1670 #define MMAP(addr, size, prot, flags) \
1671 (mmap((addr), (size), (prot), (flags)|MAP_ANONYMOUS, -1, 0))
1673 #endif
1676 #endif /* HAVE_MMAP */
1680 ----------------------- Chunk representations -----------------------
1685 This struct declaration is misleading (but accurate and necessary).
1686 It declares a "view" into memory allowing access to necessary
1687 fields at known offsets from a given base. See explanation below.
1690 struct malloc_chunk {
1692 INTERNAL_SIZE_T prev_size; /* Size of previous chunk (if free). */
1693 INTERNAL_SIZE_T size; /* Size in bytes, including overhead. */
1695 struct malloc_chunk* fd; /* double links -- used only if free. */
1696 struct malloc_chunk* bk;
1701 malloc_chunk details:
1703 (The following includes lightly edited explanations by Colin Plumb.)
1705 Chunks of memory are maintained using a `boundary tag' method as
1706 described in e.g., Knuth or Standish. (See the paper by Paul
1707 Wilson ftp://ftp.cs.utexas.edu/pub/garbage/allocsrv.ps for a
1708 survey of such techniques.) Sizes of free chunks are stored both
1709 in the front of each chunk and at the end. This makes
1710 consolidating fragmented chunks into bigger chunks very fast. The
1711 size fields also hold bits representing whether chunks are free or
1712 in use.
1714 An allocated chunk looks like this:
1717 chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1718 | Size of previous chunk, if allocated | |
1719 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1720 | Size of chunk, in bytes |M|P|
1721 mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1722 | User data starts here... .
1724 . (malloc_usable_space() bytes) .
1726 nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1727 | Size of chunk |
1728 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1731 Where "chunk" is the front of the chunk for the purpose of most of
1732 the malloc code, but "mem" is the pointer that is returned to the
1733 user. "Nextchunk" is the beginning of the next contiguous chunk.
1735 Chunks always begin on even word boundries, so the mem portion
1736 (which is returned to the user) is also on an even word boundary, and
1737 thus at least double-word aligned.
1739 Free chunks are stored in circular doubly-linked lists, and look like this:
1741 chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1742 | Size of previous chunk |
1743 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1744 `head:' | Size of chunk, in bytes |P|
1745 mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1746 | Forward pointer to next chunk in list |
1747 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1748 | Back pointer to previous chunk in list |
1749 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1750 | Unused space (may be 0 bytes long) .
1753 nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1754 `foot:' | Size of chunk, in bytes |
1755 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1757 The P (PREV_INUSE) bit, stored in the unused low-order bit of the
1758 chunk size (which is always a multiple of two words), is an in-use
1759 bit for the *previous* chunk. If that bit is *clear*, then the
1760 word before the current chunk size contains the previous chunk
1761 size, and can be used to find the front of the previous chunk.
1762 The very first chunk allocated always has this bit set,
1763 preventing access to non-existent (or non-owned) memory. If
1764 prev_inuse is set for any given chunk, then you CANNOT determine
1765 the size of the previous chunk, and might even get a memory
1766 addressing fault when trying to do so.
1768 Note that the `foot' of the current chunk is actually represented
1769 as the prev_size of the NEXT chunk. This makes it easier to
1770 deal with alignments etc but can be very confusing when trying
1771 to extend or adapt this code.
1773 The two exceptions to all this are
1775 1. The special chunk `top' doesn't bother using the
1776 trailing size field since there is no next contiguous chunk
1777 that would have to index off it. After initialization, `top'
1778 is forced to always exist. If it would become less than
1779 MINSIZE bytes long, it is replenished.
1781 2. Chunks allocated via mmap, which have the second-lowest-order
1782 bit M (IS_MMAPPED) set in their size fields. Because they are
1783 allocated one-by-one, each must contain its own trailing size field.
1788 ---------- Size and alignment checks and conversions ----------
1791 /* conversion from malloc headers to user pointers, and back */
1793 #define chunk2mem(p) ((Void_t*)((char*)(p) + 2*SIZE_SZ))
1794 #define mem2chunk(mem) ((mchunkptr)((char*)(mem) - 2*SIZE_SZ))
1796 /* The smallest possible chunk */
1797 #define MIN_CHUNK_SIZE (sizeof(struct malloc_chunk))
1799 /* The smallest size we can malloc is an aligned minimal chunk */
1801 #define MINSIZE \
1802 (unsigned long)(((MIN_CHUNK_SIZE+MALLOC_ALIGN_MASK) & ~MALLOC_ALIGN_MASK))
1804 /* Check if m has acceptable alignment */
1806 #define aligned_OK(m) (((unsigned long)((m)) & (MALLOC_ALIGN_MASK)) == 0)
1810 Check if a request is so large that it would wrap around zero when
1811 padded and aligned. To simplify some other code, the bound is made
1812 low enough so that adding MINSIZE will also not wrap around zero.
1815 #define REQUEST_OUT_OF_RANGE(req) \
1816 ((unsigned long)(req) >= \
1817 (unsigned long)(INTERNAL_SIZE_T)(-2 * MINSIZE))
1819 /* pad request bytes into a usable size -- internal version */
1821 #define request2size(req) \
1822 (((req) + SIZE_SZ + MALLOC_ALIGN_MASK < MINSIZE) ? \
1823 MINSIZE : \
1824 ((req) + SIZE_SZ + MALLOC_ALIGN_MASK) & ~MALLOC_ALIGN_MASK)
1826 /* Same, except also perform argument check */
1828 #define checked_request2size(req, sz) \
1829 if (REQUEST_OUT_OF_RANGE(req)) { \
1830 MALLOC_FAILURE_ACTION; \
1831 return 0; \
1833 (sz) = request2size(req);
1836 --------------- Physical chunk operations ---------------
1840 /* size field is or'ed with PREV_INUSE when previous adjacent chunk in use */
1841 #define PREV_INUSE 0x1
1843 /* extract inuse bit of previous chunk */
1844 #define prev_inuse(p) ((p)->size & PREV_INUSE)
1847 /* size field is or'ed with IS_MMAPPED if the chunk was obtained with mmap() */
1848 #define IS_MMAPPED 0x2
1850 /* check for mmap()'ed chunk */
1851 #define chunk_is_mmapped(p) ((p)->size & IS_MMAPPED)
1854 /* size field is or'ed with NON_MAIN_ARENA if the chunk was obtained
1855 from a non-main arena. This is only set immediately before handing
1856 the chunk to the user, if necessary. */
1857 #define NON_MAIN_ARENA 0x4
1859 /* check for chunk from non-main arena */
1860 #define chunk_non_main_arena(p) ((p)->size & NON_MAIN_ARENA)
1864 Bits to mask off when extracting size
1866 Note: IS_MMAPPED is intentionally not masked off from size field in
1867 macros for which mmapped chunks should never be seen. This should
1868 cause helpful core dumps to occur if it is tried by accident by
1869 people extending or adapting this malloc.
1871 #define SIZE_BITS (PREV_INUSE|IS_MMAPPED|NON_MAIN_ARENA)
1873 /* Get size, ignoring use bits */
1874 #define chunksize(p) ((p)->size & ~(SIZE_BITS))
1877 /* Ptr to next physical malloc_chunk. */
1878 #define next_chunk(p) ((mchunkptr)( ((char*)(p)) + ((p)->size & ~SIZE_BITS) ))
1880 /* Ptr to previous physical malloc_chunk */
1881 #define prev_chunk(p) ((mchunkptr)( ((char*)(p)) - ((p)->prev_size) ))
1883 /* Treat space at ptr + offset as a chunk */
1884 #define chunk_at_offset(p, s) ((mchunkptr)(((char*)(p)) + (s)))
1886 /* extract p's inuse bit */
1887 #define inuse(p)\
1888 ((((mchunkptr)(((char*)(p))+((p)->size & ~SIZE_BITS)))->size) & PREV_INUSE)
1890 /* set/clear chunk as being inuse without otherwise disturbing */
1891 #define set_inuse(p)\
1892 ((mchunkptr)(((char*)(p)) + ((p)->size & ~SIZE_BITS)))->size |= PREV_INUSE
1894 #define clear_inuse(p)\
1895 ((mchunkptr)(((char*)(p)) + ((p)->size & ~SIZE_BITS)))->size &= ~(PREV_INUSE)
1898 /* check/set/clear inuse bits in known places */
1899 #define inuse_bit_at_offset(p, s)\
1900 (((mchunkptr)(((char*)(p)) + (s)))->size & PREV_INUSE)
1902 #define set_inuse_bit_at_offset(p, s)\
1903 (((mchunkptr)(((char*)(p)) + (s)))->size |= PREV_INUSE)
1905 #define clear_inuse_bit_at_offset(p, s)\
1906 (((mchunkptr)(((char*)(p)) + (s)))->size &= ~(PREV_INUSE))
1909 /* Set size at head, without disturbing its use bit */
1910 #define set_head_size(p, s) ((p)->size = (((p)->size & SIZE_BITS) | (s)))
1912 /* Set size/use field */
1913 #define set_head(p, s) ((p)->size = (s))
1915 /* Set size at footer (only when chunk is not in use) */
1916 #define set_foot(p, s) (((mchunkptr)((char*)(p) + (s)))->prev_size = (s))
1920 -------------------- Internal data structures --------------------
1922 All internal state is held in an instance of malloc_state defined
1923 below. There are no other static variables, except in two optional
1924 cases:
1925 * If USE_MALLOC_LOCK is defined, the mALLOC_MUTEx declared above.
1926 * If HAVE_MMAP is true, but mmap doesn't support
1927 MAP_ANONYMOUS, a dummy file descriptor for mmap.
1929 Beware of lots of tricks that minimize the total bookkeeping space
1930 requirements. The result is a little over 1K bytes (for 4byte
1931 pointers and size_t.)
1935 Bins
1937 An array of bin headers for free chunks. Each bin is doubly
1938 linked. The bins are approximately proportionally (log) spaced.
1939 There are a lot of these bins (128). This may look excessive, but
1940 works very well in practice. Most bins hold sizes that are
1941 unusual as malloc request sizes, but are more usual for fragments
1942 and consolidated sets of chunks, which is what these bins hold, so
1943 they can be found quickly. All procedures maintain the invariant
1944 that no consolidated chunk physically borders another one, so each
1945 chunk in a list is known to be preceeded and followed by either
1946 inuse chunks or the ends of memory.
1948 Chunks in bins are kept in size order, with ties going to the
1949 approximately least recently used chunk. Ordering isn't needed
1950 for the small bins, which all contain the same-sized chunks, but
1951 facilitates best-fit allocation for larger chunks. These lists
1952 are just sequential. Keeping them in order almost never requires
1953 enough traversal to warrant using fancier ordered data
1954 structures.
1956 Chunks of the same size are linked with the most
1957 recently freed at the front, and allocations are taken from the
1958 back. This results in LRU (FIFO) allocation order, which tends
1959 to give each chunk an equal opportunity to be consolidated with
1960 adjacent freed chunks, resulting in larger free chunks and less
1961 fragmentation.
1963 To simplify use in double-linked lists, each bin header acts
1964 as a malloc_chunk. This avoids special-casing for headers.
1965 But to conserve space and improve locality, we allocate
1966 only the fd/bk pointers of bins, and then use repositioning tricks
1967 to treat these as the fields of a malloc_chunk*.
1970 typedef struct malloc_chunk* mbinptr;
1972 /* addressing -- note that bin_at(0) does not exist */
1973 #define bin_at(m, i) ((mbinptr)((char*)&((m)->bins[(i)<<1]) - (SIZE_SZ<<1)))
1975 /* analog of ++bin */
1976 #define next_bin(b) ((mbinptr)((char*)(b) + (sizeof(mchunkptr)<<1)))
1978 /* Reminders about list directionality within bins */
1979 #define first(b) ((b)->fd)
1980 #define last(b) ((b)->bk)
1982 /* Take a chunk off a bin list */
1983 #define unlink(P, BK, FD) { \
1984 FD = P->fd; \
1985 BK = P->bk; \
1986 if (__builtin_expect (FD->bk != P || BK->fd != P, 0)) \
1987 malloc_printerr (check_action, "corrupted double-linked list", P); \
1988 else { \
1989 FD->bk = BK; \
1990 BK->fd = FD; \
1995 Indexing
1997 Bins for sizes < 512 bytes contain chunks of all the same size, spaced
1998 8 bytes apart. Larger bins are approximately logarithmically spaced:
2000 64 bins of size 8
2001 32 bins of size 64
2002 16 bins of size 512
2003 8 bins of size 4096
2004 4 bins of size 32768
2005 2 bins of size 262144
2006 1 bin of size what's left
2008 There is actually a little bit of slop in the numbers in bin_index
2009 for the sake of speed. This makes no difference elsewhere.
2011 The bins top out around 1MB because we expect to service large
2012 requests via mmap.
2015 #define NBINS 128
2016 #define NSMALLBINS 64
2017 #define SMALLBIN_WIDTH 8
2018 #define MIN_LARGE_SIZE 512
2020 #define in_smallbin_range(sz) \
2021 ((unsigned long)(sz) < (unsigned long)MIN_LARGE_SIZE)
2023 #define smallbin_index(sz) (((unsigned)(sz)) >> 3)
2025 #define largebin_index(sz) \
2026 (((((unsigned long)(sz)) >> 6) <= 32)? 56 + (((unsigned long)(sz)) >> 6): \
2027 ((((unsigned long)(sz)) >> 9) <= 20)? 91 + (((unsigned long)(sz)) >> 9): \
2028 ((((unsigned long)(sz)) >> 12) <= 10)? 110 + (((unsigned long)(sz)) >> 12): \
2029 ((((unsigned long)(sz)) >> 15) <= 4)? 119 + (((unsigned long)(sz)) >> 15): \
2030 ((((unsigned long)(sz)) >> 18) <= 2)? 124 + (((unsigned long)(sz)) >> 18): \
2031 126)
2033 #define bin_index(sz) \
2034 ((in_smallbin_range(sz)) ? smallbin_index(sz) : largebin_index(sz))
2038 Unsorted chunks
2040 All remainders from chunk splits, as well as all returned chunks,
2041 are first placed in the "unsorted" bin. They are then placed
2042 in regular bins after malloc gives them ONE chance to be used before
2043 binning. So, basically, the unsorted_chunks list acts as a queue,
2044 with chunks being placed on it in free (and malloc_consolidate),
2045 and taken off (to be either used or placed in bins) in malloc.
2047 The NON_MAIN_ARENA flag is never set for unsorted chunks, so it
2048 does not have to be taken into account in size comparisons.
2051 /* The otherwise unindexable 1-bin is used to hold unsorted chunks. */
2052 #define unsorted_chunks(M) (bin_at(M, 1))
2057 The top-most available chunk (i.e., the one bordering the end of
2058 available memory) is treated specially. It is never included in
2059 any bin, is used only if no other chunk is available, and is
2060 released back to the system if it is very large (see
2061 M_TRIM_THRESHOLD). Because top initially
2062 points to its own bin with initial zero size, thus forcing
2063 extension on the first malloc request, we avoid having any special
2064 code in malloc to check whether it even exists yet. But we still
2065 need to do so when getting memory from system, so we make
2066 initial_top treat the bin as a legal but unusable chunk during the
2067 interval between initialization and the first call to
2068 sYSMALLOc. (This is somewhat delicate, since it relies on
2069 the 2 preceding words to be zero during this interval as well.)
2072 /* Conveniently, the unsorted bin can be used as dummy top on first call */
2073 #define initial_top(M) (unsorted_chunks(M))
2076 Binmap
2078 To help compensate for the large number of bins, a one-level index
2079 structure is used for bin-by-bin searching. `binmap' is a
2080 bitvector recording whether bins are definitely empty so they can
2081 be skipped over during during traversals. The bits are NOT always
2082 cleared as soon as bins are empty, but instead only
2083 when they are noticed to be empty during traversal in malloc.
2086 /* Conservatively use 32 bits per map word, even if on 64bit system */
2087 #define BINMAPSHIFT 5
2088 #define BITSPERMAP (1U << BINMAPSHIFT)
2089 #define BINMAPSIZE (NBINS / BITSPERMAP)
2091 #define idx2block(i) ((i) >> BINMAPSHIFT)
2092 #define idx2bit(i) ((1U << ((i) & ((1U << BINMAPSHIFT)-1))))
2094 #define mark_bin(m,i) ((m)->binmap[idx2block(i)] |= idx2bit(i))
2095 #define unmark_bin(m,i) ((m)->binmap[idx2block(i)] &= ~(idx2bit(i)))
2096 #define get_binmap(m,i) ((m)->binmap[idx2block(i)] & idx2bit(i))
2099 Fastbins
2101 An array of lists holding recently freed small chunks. Fastbins
2102 are not doubly linked. It is faster to single-link them, and
2103 since chunks are never removed from the middles of these lists,
2104 double linking is not necessary. Also, unlike regular bins, they
2105 are not even processed in FIFO order (they use faster LIFO) since
2106 ordering doesn't much matter in the transient contexts in which
2107 fastbins are normally used.
2109 Chunks in fastbins keep their inuse bit set, so they cannot
2110 be consolidated with other free chunks. malloc_consolidate
2111 releases all chunks in fastbins and consolidates them with
2112 other free chunks.
2115 typedef struct malloc_chunk* mfastbinptr;
2117 /* offset 2 to use otherwise unindexable first 2 bins */
2118 #define fastbin_index(sz) ((((unsigned int)(sz)) >> 3) - 2)
2120 /* The maximum fastbin request size we support */
2121 #define MAX_FAST_SIZE 80
2123 #define NFASTBINS (fastbin_index(request2size(MAX_FAST_SIZE))+1)
2126 FASTBIN_CONSOLIDATION_THRESHOLD is the size of a chunk in free()
2127 that triggers automatic consolidation of possibly-surrounding
2128 fastbin chunks. This is a heuristic, so the exact value should not
2129 matter too much. It is defined at half the default trim threshold as a
2130 compromise heuristic to only attempt consolidation if it is likely
2131 to lead to trimming. However, it is not dynamically tunable, since
2132 consolidation reduces fragmentation surrounding large chunks even
2133 if trimming is not used.
2136 #define FASTBIN_CONSOLIDATION_THRESHOLD (65536UL)
2139 Since the lowest 2 bits in max_fast don't matter in size comparisons,
2140 they are used as flags.
2144 FASTCHUNKS_BIT held in max_fast indicates that there are probably
2145 some fastbin chunks. It is set true on entering a chunk into any
2146 fastbin, and cleared only in malloc_consolidate.
2148 The truth value is inverted so that have_fastchunks will be true
2149 upon startup (since statics are zero-filled), simplifying
2150 initialization checks.
2153 #define FASTCHUNKS_BIT (1U)
2155 #define have_fastchunks(M) (((M)->max_fast & FASTCHUNKS_BIT) == 0)
2156 #define clear_fastchunks(M) ((M)->max_fast |= FASTCHUNKS_BIT)
2157 #define set_fastchunks(M) ((M)->max_fast &= ~FASTCHUNKS_BIT)
2160 NONCONTIGUOUS_BIT indicates that MORECORE does not return contiguous
2161 regions. Otherwise, contiguity is exploited in merging together,
2162 when possible, results from consecutive MORECORE calls.
2164 The initial value comes from MORECORE_CONTIGUOUS, but is
2165 changed dynamically if mmap is ever used as an sbrk substitute.
2168 #define NONCONTIGUOUS_BIT (2U)
2170 #define contiguous(M) (((M)->max_fast & NONCONTIGUOUS_BIT) == 0)
2171 #define noncontiguous(M) (((M)->max_fast & NONCONTIGUOUS_BIT) != 0)
2172 #define set_noncontiguous(M) ((M)->max_fast |= NONCONTIGUOUS_BIT)
2173 #define set_contiguous(M) ((M)->max_fast &= ~NONCONTIGUOUS_BIT)
2176 Set value of max_fast.
2177 Use impossibly small value if 0.
2178 Precondition: there are no existing fastbin chunks.
2179 Setting the value clears fastchunk bit but preserves noncontiguous bit.
2182 #define set_max_fast(M, s) \
2183 (M)->max_fast = (((s) == 0)? SMALLBIN_WIDTH: request2size(s)) | \
2184 FASTCHUNKS_BIT | \
2185 ((M)->max_fast & NONCONTIGUOUS_BIT)
2189 ----------- Internal state representation and initialization -----------
2192 struct malloc_state {
2193 /* Serialize access. */
2194 mutex_t mutex;
2195 // Should we have padding to move the mutex to its own cache line?
2197 #if THREAD_STATS
2198 /* Statistics for locking. Only used if THREAD_STATS is defined. */
2199 long stat_lock_direct, stat_lock_loop, stat_lock_wait;
2200 #endif
2202 /* The maximum chunk size to be eligible for fastbin */
2203 INTERNAL_SIZE_T max_fast; /* low 2 bits used as flags */
2205 /* Fastbins */
2206 mfastbinptr fastbins[NFASTBINS];
2208 /* Base of the topmost chunk -- not otherwise kept in a bin */
2209 mchunkptr top;
2211 /* The remainder from the most recent split of a small request */
2212 mchunkptr last_remainder;
2214 /* Normal bins packed as described above */
2215 mchunkptr bins[NBINS * 2];
2217 /* Bitmap of bins */
2218 unsigned int binmap[BINMAPSIZE];
2220 /* Linked list */
2221 struct malloc_state *next;
2223 /* Memory allocated from the system in this arena. */
2224 INTERNAL_SIZE_T system_mem;
2225 INTERNAL_SIZE_T max_system_mem;
2228 struct malloc_par {
2229 /* Tunable parameters */
2230 unsigned long trim_threshold;
2231 INTERNAL_SIZE_T top_pad;
2232 INTERNAL_SIZE_T mmap_threshold;
2234 /* Memory map support */
2235 int n_mmaps;
2236 int n_mmaps_max;
2237 int max_n_mmaps;
2239 /* Cache malloc_getpagesize */
2240 unsigned int pagesize;
2242 /* Statistics */
2243 INTERNAL_SIZE_T mmapped_mem;
2244 /*INTERNAL_SIZE_T sbrked_mem;*/
2245 /*INTERNAL_SIZE_T max_sbrked_mem;*/
2246 INTERNAL_SIZE_T max_mmapped_mem;
2247 INTERNAL_SIZE_T max_total_mem; /* only kept for NO_THREADS */
2249 /* First address handed out by MORECORE/sbrk. */
2250 char* sbrk_base;
2253 /* There are several instances of this struct ("arenas") in this
2254 malloc. If you are adapting this malloc in a way that does NOT use
2255 a static or mmapped malloc_state, you MUST explicitly zero-fill it
2256 before using. This malloc relies on the property that malloc_state
2257 is initialized to all zeroes (as is true of C statics). */
2259 static struct malloc_state main_arena;
2261 /* There is only one instance of the malloc parameters. */
2263 static struct malloc_par mp_;
2266 Initialize a malloc_state struct.
2268 This is called only from within malloc_consolidate, which needs
2269 be called in the same contexts anyway. It is never called directly
2270 outside of malloc_consolidate because some optimizing compilers try
2271 to inline it at all call points, which turns out not to be an
2272 optimization at all. (Inlining it in malloc_consolidate is fine though.)
2275 #if __STD_C
2276 static void malloc_init_state(mstate av)
2277 #else
2278 static void malloc_init_state(av) mstate av;
2279 #endif
2281 int i;
2282 mbinptr bin;
2284 /* Establish circular links for normal bins */
2285 for (i = 1; i < NBINS; ++i) {
2286 bin = bin_at(av,i);
2287 bin->fd = bin->bk = bin;
2290 #if MORECORE_CONTIGUOUS
2291 if (av != &main_arena)
2292 #endif
2293 set_noncontiguous(av);
2295 set_max_fast(av, DEFAULT_MXFAST);
2297 av->top = initial_top(av);
2301 Other internal utilities operating on mstates
2304 #if __STD_C
2305 static Void_t* sYSMALLOc(INTERNAL_SIZE_T, mstate);
2306 static int sYSTRIm(size_t, mstate);
2307 static void malloc_consolidate(mstate);
2308 static Void_t** iALLOc(mstate, size_t, size_t*, int, Void_t**);
2309 #else
2310 static Void_t* sYSMALLOc();
2311 static int sYSTRIm();
2312 static void malloc_consolidate();
2313 static Void_t** iALLOc();
2314 #endif
2317 /* -------------- Early definitions for debugging hooks ---------------- */
2319 /* Define and initialize the hook variables. These weak definitions must
2320 appear before any use of the variables in a function (arena.c uses one). */
2321 #ifndef weak_variable
2322 #ifndef _LIBC
2323 #define weak_variable /**/
2324 #else
2325 /* In GNU libc we want the hook variables to be weak definitions to
2326 avoid a problem with Emacs. */
2327 #define weak_variable weak_function
2328 #endif
2329 #endif
2331 /* Forward declarations. */
2332 static Void_t* malloc_hook_ini __MALLOC_P ((size_t sz,
2333 const __malloc_ptr_t caller));
2334 static Void_t* realloc_hook_ini __MALLOC_P ((Void_t* ptr, size_t sz,
2335 const __malloc_ptr_t caller));
2336 static Void_t* memalign_hook_ini __MALLOC_P ((size_t alignment, size_t sz,
2337 const __malloc_ptr_t caller));
2339 void weak_variable (*__malloc_initialize_hook) (void) = NULL;
2340 void weak_variable (*__free_hook) (__malloc_ptr_t __ptr,
2341 const __malloc_ptr_t) = NULL;
2342 __malloc_ptr_t weak_variable (*__malloc_hook)
2343 (size_t __size, const __malloc_ptr_t) = malloc_hook_ini;
2344 __malloc_ptr_t weak_variable (*__realloc_hook)
2345 (__malloc_ptr_t __ptr, size_t __size, const __malloc_ptr_t)
2346 = realloc_hook_ini;
2347 __malloc_ptr_t weak_variable (*__memalign_hook)
2348 (size_t __alignment, size_t __size, const __malloc_ptr_t)
2349 = memalign_hook_ini;
2350 void weak_variable (*__after_morecore_hook) (void) = NULL;
2353 /* ---------------- Error behavior ------------------------------------ */
2355 #ifndef DEFAULT_CHECK_ACTION
2356 #define DEFAULT_CHECK_ACTION 3
2357 #endif
2359 static int check_action = DEFAULT_CHECK_ACTION;
2362 /* ------------------- Support for multiple arenas -------------------- */
2363 #include "arena.c"
2366 Debugging support
2368 These routines make a number of assertions about the states
2369 of data structures that should be true at all times. If any
2370 are not true, it's very likely that a user program has somehow
2371 trashed memory. (It's also possible that there is a coding error
2372 in malloc. In which case, please report it!)
2375 #if ! MALLOC_DEBUG
2377 #define check_chunk(A,P)
2378 #define check_free_chunk(A,P)
2379 #define check_inuse_chunk(A,P)
2380 #define check_remalloced_chunk(A,P,N)
2381 #define check_malloced_chunk(A,P,N)
2382 #define check_malloc_state(A)
2384 #else
2386 #define check_chunk(A,P) do_check_chunk(A,P)
2387 #define check_free_chunk(A,P) do_check_free_chunk(A,P)
2388 #define check_inuse_chunk(A,P) do_check_inuse_chunk(A,P)
2389 #define check_remalloced_chunk(A,P,N) do_check_remalloced_chunk(A,P,N)
2390 #define check_malloced_chunk(A,P,N) do_check_malloced_chunk(A,P,N)
2391 #define check_malloc_state(A) do_check_malloc_state(A)
2394 Properties of all chunks
2397 #if __STD_C
2398 static void do_check_chunk(mstate av, mchunkptr p)
2399 #else
2400 static void do_check_chunk(av, p) mstate av; mchunkptr p;
2401 #endif
2403 unsigned long sz = chunksize(p);
2404 /* min and max possible addresses assuming contiguous allocation */
2405 char* max_address = (char*)(av->top) + chunksize(av->top);
2406 char* min_address = max_address - av->system_mem;
2408 if (!chunk_is_mmapped(p)) {
2410 /* Has legal address ... */
2411 if (p != av->top) {
2412 if (contiguous(av)) {
2413 assert(((char*)p) >= min_address);
2414 assert(((char*)p + sz) <= ((char*)(av->top)));
2417 else {
2418 /* top size is always at least MINSIZE */
2419 assert((unsigned long)(sz) >= MINSIZE);
2420 /* top predecessor always marked inuse */
2421 assert(prev_inuse(p));
2425 else {
2426 #if HAVE_MMAP
2427 /* address is outside main heap */
2428 if (contiguous(av) && av->top != initial_top(av)) {
2429 assert(((char*)p) < min_address || ((char*)p) > max_address);
2431 /* chunk is page-aligned */
2432 assert(((p->prev_size + sz) & (mp_.pagesize-1)) == 0);
2433 /* mem is aligned */
2434 assert(aligned_OK(chunk2mem(p)));
2435 #else
2436 /* force an appropriate assert violation if debug set */
2437 assert(!chunk_is_mmapped(p));
2438 #endif
2443 Properties of free chunks
2446 #if __STD_C
2447 static void do_check_free_chunk(mstate av, mchunkptr p)
2448 #else
2449 static void do_check_free_chunk(av, p) mstate av; mchunkptr p;
2450 #endif
2452 INTERNAL_SIZE_T sz = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
2453 mchunkptr next = chunk_at_offset(p, sz);
2455 do_check_chunk(av, p);
2457 /* Chunk must claim to be free ... */
2458 assert(!inuse(p));
2459 assert (!chunk_is_mmapped(p));
2461 /* Unless a special marker, must have OK fields */
2462 if ((unsigned long)(sz) >= MINSIZE)
2464 assert((sz & MALLOC_ALIGN_MASK) == 0);
2465 assert(aligned_OK(chunk2mem(p)));
2466 /* ... matching footer field */
2467 assert(next->prev_size == sz);
2468 /* ... and is fully consolidated */
2469 assert(prev_inuse(p));
2470 assert (next == av->top || inuse(next));
2472 /* ... and has minimally sane links */
2473 assert(p->fd->bk == p);
2474 assert(p->bk->fd == p);
2476 else /* markers are always of size SIZE_SZ */
2477 assert(sz == SIZE_SZ);
2481 Properties of inuse chunks
2484 #if __STD_C
2485 static void do_check_inuse_chunk(mstate av, mchunkptr p)
2486 #else
2487 static void do_check_inuse_chunk(av, p) mstate av; mchunkptr p;
2488 #endif
2490 mchunkptr next;
2492 do_check_chunk(av, p);
2494 if (chunk_is_mmapped(p))
2495 return; /* mmapped chunks have no next/prev */
2497 /* Check whether it claims to be in use ... */
2498 assert(inuse(p));
2500 next = next_chunk(p);
2502 /* ... and is surrounded by OK chunks.
2503 Since more things can be checked with free chunks than inuse ones,
2504 if an inuse chunk borders them and debug is on, it's worth doing them.
2506 if (!prev_inuse(p)) {
2507 /* Note that we cannot even look at prev unless it is not inuse */
2508 mchunkptr prv = prev_chunk(p);
2509 assert(next_chunk(prv) == p);
2510 do_check_free_chunk(av, prv);
2513 if (next == av->top) {
2514 assert(prev_inuse(next));
2515 assert(chunksize(next) >= MINSIZE);
2517 else if (!inuse(next))
2518 do_check_free_chunk(av, next);
2522 Properties of chunks recycled from fastbins
2525 #if __STD_C
2526 static void do_check_remalloced_chunk(mstate av, mchunkptr p, INTERNAL_SIZE_T s)
2527 #else
2528 static void do_check_remalloced_chunk(av, p, s)
2529 mstate av; mchunkptr p; INTERNAL_SIZE_T s;
2530 #endif
2532 INTERNAL_SIZE_T sz = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
2534 if (!chunk_is_mmapped(p)) {
2535 assert(av == arena_for_chunk(p));
2536 if (chunk_non_main_arena(p))
2537 assert(av != &main_arena);
2538 else
2539 assert(av == &main_arena);
2542 do_check_inuse_chunk(av, p);
2544 /* Legal size ... */
2545 assert((sz & MALLOC_ALIGN_MASK) == 0);
2546 assert((unsigned long)(sz) >= MINSIZE);
2547 /* ... and alignment */
2548 assert(aligned_OK(chunk2mem(p)));
2549 /* chunk is less than MINSIZE more than request */
2550 assert((long)(sz) - (long)(s) >= 0);
2551 assert((long)(sz) - (long)(s + MINSIZE) < 0);
2555 Properties of nonrecycled chunks at the point they are malloced
2558 #if __STD_C
2559 static void do_check_malloced_chunk(mstate av, mchunkptr p, INTERNAL_SIZE_T s)
2560 #else
2561 static void do_check_malloced_chunk(av, p, s)
2562 mstate av; mchunkptr p; INTERNAL_SIZE_T s;
2563 #endif
2565 /* same as recycled case ... */
2566 do_check_remalloced_chunk(av, p, s);
2569 ... plus, must obey implementation invariant that prev_inuse is
2570 always true of any allocated chunk; i.e., that each allocated
2571 chunk borders either a previously allocated and still in-use
2572 chunk, or the base of its memory arena. This is ensured
2573 by making all allocations from the the `lowest' part of any found
2574 chunk. This does not necessarily hold however for chunks
2575 recycled via fastbins.
2578 assert(prev_inuse(p));
2583 Properties of malloc_state.
2585 This may be useful for debugging malloc, as well as detecting user
2586 programmer errors that somehow write into malloc_state.
2588 If you are extending or experimenting with this malloc, you can
2589 probably figure out how to hack this routine to print out or
2590 display chunk addresses, sizes, bins, and other instrumentation.
2593 static void do_check_malloc_state(mstate av)
2595 int i;
2596 mchunkptr p;
2597 mchunkptr q;
2598 mbinptr b;
2599 unsigned int binbit;
2600 int empty;
2601 unsigned int idx;
2602 INTERNAL_SIZE_T size;
2603 unsigned long total = 0;
2604 int max_fast_bin;
2606 /* internal size_t must be no wider than pointer type */
2607 assert(sizeof(INTERNAL_SIZE_T) <= sizeof(char*));
2609 /* alignment is a power of 2 */
2610 assert((MALLOC_ALIGNMENT & (MALLOC_ALIGNMENT-1)) == 0);
2612 /* cannot run remaining checks until fully initialized */
2613 if (av->top == 0 || av->top == initial_top(av))
2614 return;
2616 /* pagesize is a power of 2 */
2617 assert((mp_.pagesize & (mp_.pagesize-1)) == 0);
2619 /* A contiguous main_arena is consistent with sbrk_base. */
2620 if (av == &main_arena && contiguous(av))
2621 assert((char*)mp_.sbrk_base + av->system_mem ==
2622 (char*)av->top + chunksize(av->top));
2624 /* properties of fastbins */
2626 /* max_fast is in allowed range */
2627 assert((av->max_fast & ~1) <= request2size(MAX_FAST_SIZE));
2629 max_fast_bin = fastbin_index(av->max_fast);
2631 for (i = 0; i < NFASTBINS; ++i) {
2632 p = av->fastbins[i];
2634 /* all bins past max_fast are empty */
2635 if (i > max_fast_bin)
2636 assert(p == 0);
2638 while (p != 0) {
2639 /* each chunk claims to be inuse */
2640 do_check_inuse_chunk(av, p);
2641 total += chunksize(p);
2642 /* chunk belongs in this bin */
2643 assert(fastbin_index(chunksize(p)) == i);
2644 p = p->fd;
2648 if (total != 0)
2649 assert(have_fastchunks(av));
2650 else if (!have_fastchunks(av))
2651 assert(total == 0);
2653 /* check normal bins */
2654 for (i = 1; i < NBINS; ++i) {
2655 b = bin_at(av,i);
2657 /* binmap is accurate (except for bin 1 == unsorted_chunks) */
2658 if (i >= 2) {
2659 binbit = get_binmap(av,i);
2660 empty = last(b) == b;
2661 if (!binbit)
2662 assert(empty);
2663 else if (!empty)
2664 assert(binbit);
2667 for (p = last(b); p != b; p = p->bk) {
2668 /* each chunk claims to be free */
2669 do_check_free_chunk(av, p);
2670 size = chunksize(p);
2671 total += size;
2672 if (i >= 2) {
2673 /* chunk belongs in bin */
2674 idx = bin_index(size);
2675 assert(idx == i);
2676 /* lists are sorted */
2677 assert(p->bk == b ||
2678 (unsigned long)chunksize(p->bk) >= (unsigned long)chunksize(p));
2680 /* chunk is followed by a legal chain of inuse chunks */
2681 for (q = next_chunk(p);
2682 (q != av->top && inuse(q) &&
2683 (unsigned long)(chunksize(q)) >= MINSIZE);
2684 q = next_chunk(q))
2685 do_check_inuse_chunk(av, q);
2689 /* top chunk is OK */
2690 check_chunk(av, av->top);
2692 /* sanity checks for statistics */
2694 #ifdef NO_THREADS
2695 assert(total <= (unsigned long)(mp_.max_total_mem));
2696 assert(mp_.n_mmaps >= 0);
2697 #endif
2698 assert(mp_.n_mmaps <= mp_.n_mmaps_max);
2699 assert(mp_.n_mmaps <= mp_.max_n_mmaps);
2701 assert((unsigned long)(av->system_mem) <=
2702 (unsigned long)(av->max_system_mem));
2704 assert((unsigned long)(mp_.mmapped_mem) <=
2705 (unsigned long)(mp_.max_mmapped_mem));
2707 #ifdef NO_THREADS
2708 assert((unsigned long)(mp_.max_total_mem) >=
2709 (unsigned long)(mp_.mmapped_mem) + (unsigned long)(av->system_mem));
2710 #endif
2712 #endif
2715 /* ----------------- Support for debugging hooks -------------------- */
2716 #include "hooks.c"
2719 /* ----------- Routines dealing with system allocation -------------- */
2722 sysmalloc handles malloc cases requiring more memory from the system.
2723 On entry, it is assumed that av->top does not have enough
2724 space to service request for nb bytes, thus requiring that av->top
2725 be extended or replaced.
2728 #if __STD_C
2729 static Void_t* sYSMALLOc(INTERNAL_SIZE_T nb, mstate av)
2730 #else
2731 static Void_t* sYSMALLOc(nb, av) INTERNAL_SIZE_T nb; mstate av;
2732 #endif
2734 mchunkptr old_top; /* incoming value of av->top */
2735 INTERNAL_SIZE_T old_size; /* its size */
2736 char* old_end; /* its end address */
2738 long size; /* arg to first MORECORE or mmap call */
2739 char* brk; /* return value from MORECORE */
2741 long correction; /* arg to 2nd MORECORE call */
2742 char* snd_brk; /* 2nd return val */
2744 INTERNAL_SIZE_T front_misalign; /* unusable bytes at front of new space */
2745 INTERNAL_SIZE_T end_misalign; /* partial page left at end of new space */
2746 char* aligned_brk; /* aligned offset into brk */
2748 mchunkptr p; /* the allocated/returned chunk */
2749 mchunkptr remainder; /* remainder from allocation */
2750 unsigned long remainder_size; /* its size */
2752 unsigned long sum; /* for updating stats */
2754 size_t pagemask = mp_.pagesize - 1;
2757 #if HAVE_MMAP
2760 If have mmap, and the request size meets the mmap threshold, and
2761 the system supports mmap, and there are few enough currently
2762 allocated mmapped regions, try to directly map this request
2763 rather than expanding top.
2766 if ((unsigned long)(nb) >= (unsigned long)(mp_.mmap_threshold) &&
2767 (mp_.n_mmaps < mp_.n_mmaps_max)) {
2769 char* mm; /* return value from mmap call*/
2772 Round up size to nearest page. For mmapped chunks, the overhead
2773 is one SIZE_SZ unit larger than for normal chunks, because there
2774 is no following chunk whose prev_size field could be used.
2776 size = (nb + SIZE_SZ + MALLOC_ALIGN_MASK + pagemask) & ~pagemask;
2778 /* Don't try if size wraps around 0 */
2779 if ((unsigned long)(size) > (unsigned long)(nb)) {
2781 mm = (char*)(MMAP(0, size, PROT_READ|PROT_WRITE, MAP_PRIVATE));
2783 if (mm != MAP_FAILED) {
2786 The offset to the start of the mmapped region is stored
2787 in the prev_size field of the chunk. This allows us to adjust
2788 returned start address to meet alignment requirements here
2789 and in memalign(), and still be able to compute proper
2790 address argument for later munmap in free() and realloc().
2793 front_misalign = (INTERNAL_SIZE_T)chunk2mem(mm) & MALLOC_ALIGN_MASK;
2794 if (front_misalign > 0) {
2795 correction = MALLOC_ALIGNMENT - front_misalign;
2796 p = (mchunkptr)(mm + correction);
2797 p->prev_size = correction;
2798 set_head(p, (size - correction) |IS_MMAPPED);
2800 else {
2801 p = (mchunkptr)mm;
2802 set_head(p, size|IS_MMAPPED);
2805 /* update statistics */
2807 if (++mp_.n_mmaps > mp_.max_n_mmaps)
2808 mp_.max_n_mmaps = mp_.n_mmaps;
2810 sum = mp_.mmapped_mem += size;
2811 if (sum > (unsigned long)(mp_.max_mmapped_mem))
2812 mp_.max_mmapped_mem = sum;
2813 #ifdef NO_THREADS
2814 sum += av->system_mem;
2815 if (sum > (unsigned long)(mp_.max_total_mem))
2816 mp_.max_total_mem = sum;
2817 #endif
2819 check_chunk(av, p);
2821 return chunk2mem(p);
2825 #endif
2827 /* Record incoming configuration of top */
2829 old_top = av->top;
2830 old_size = chunksize(old_top);
2831 old_end = (char*)(chunk_at_offset(old_top, old_size));
2833 brk = snd_brk = (char*)(MORECORE_FAILURE);
2836 If not the first time through, we require old_size to be
2837 at least MINSIZE and to have prev_inuse set.
2840 assert((old_top == initial_top(av) && old_size == 0) ||
2841 ((unsigned long) (old_size) >= MINSIZE &&
2842 prev_inuse(old_top) &&
2843 ((unsigned long)old_end & pagemask) == 0));
2845 /* Precondition: not enough current space to satisfy nb request */
2846 assert((unsigned long)(old_size) < (unsigned long)(nb + MINSIZE));
2848 /* Precondition: all fastbins are consolidated */
2849 assert(!have_fastchunks(av));
2852 if (av != &main_arena) {
2854 heap_info *old_heap, *heap;
2855 size_t old_heap_size;
2857 /* First try to extend the current heap. */
2858 old_heap = heap_for_ptr(old_top);
2859 old_heap_size = old_heap->size;
2860 if (grow_heap(old_heap, MINSIZE + nb - old_size) == 0) {
2861 av->system_mem += old_heap->size - old_heap_size;
2862 arena_mem += old_heap->size - old_heap_size;
2863 #if 0
2864 if(mmapped_mem + arena_mem + sbrked_mem > max_total_mem)
2865 max_total_mem = mmapped_mem + arena_mem + sbrked_mem;
2866 #endif
2867 set_head(old_top, (((char *)old_heap + old_heap->size) - (char *)old_top)
2868 | PREV_INUSE);
2870 else if ((heap = new_heap(nb + (MINSIZE + sizeof(*heap)), mp_.top_pad))) {
2871 /* Use a newly allocated heap. */
2872 heap->ar_ptr = av;
2873 heap->prev = old_heap;
2874 av->system_mem += heap->size;
2875 arena_mem += heap->size;
2876 #if 0
2877 if((unsigned long)(mmapped_mem + arena_mem + sbrked_mem) > max_total_mem)
2878 max_total_mem = mmapped_mem + arena_mem + sbrked_mem;
2879 #endif
2880 /* Set up the new top. */
2881 top(av) = chunk_at_offset(heap, sizeof(*heap));
2882 set_head(top(av), (heap->size - sizeof(*heap)) | PREV_INUSE);
2884 /* Setup fencepost and free the old top chunk. */
2885 /* The fencepost takes at least MINSIZE bytes, because it might
2886 become the top chunk again later. Note that a footer is set
2887 up, too, although the chunk is marked in use. */
2888 old_size -= MINSIZE;
2889 set_head(chunk_at_offset(old_top, old_size + 2*SIZE_SZ), 0|PREV_INUSE);
2890 if (old_size >= MINSIZE) {
2891 set_head(chunk_at_offset(old_top, old_size), (2*SIZE_SZ)|PREV_INUSE);
2892 set_foot(chunk_at_offset(old_top, old_size), (2*SIZE_SZ));
2893 set_head(old_top, old_size|PREV_INUSE|NON_MAIN_ARENA);
2894 _int_free(av, chunk2mem(old_top));
2895 } else {
2896 set_head(old_top, (old_size + 2*SIZE_SZ)|PREV_INUSE);
2897 set_foot(old_top, (old_size + 2*SIZE_SZ));
2901 } else { /* av == main_arena */
2904 /* Request enough space for nb + pad + overhead */
2906 size = nb + mp_.top_pad + MINSIZE;
2909 If contiguous, we can subtract out existing space that we hope to
2910 combine with new space. We add it back later only if
2911 we don't actually get contiguous space.
2914 if (contiguous(av))
2915 size -= old_size;
2918 Round to a multiple of page size.
2919 If MORECORE is not contiguous, this ensures that we only call it
2920 with whole-page arguments. And if MORECORE is contiguous and
2921 this is not first time through, this preserves page-alignment of
2922 previous calls. Otherwise, we correct to page-align below.
2925 size = (size + pagemask) & ~pagemask;
2928 Don't try to call MORECORE if argument is so big as to appear
2929 negative. Note that since mmap takes size_t arg, it may succeed
2930 below even if we cannot call MORECORE.
2933 if (size > 0)
2934 brk = (char*)(MORECORE(size));
2936 if (brk != (char*)(MORECORE_FAILURE)) {
2937 /* Call the `morecore' hook if necessary. */
2938 if (__after_morecore_hook)
2939 (*__after_morecore_hook) ();
2940 } else {
2942 If have mmap, try using it as a backup when MORECORE fails or
2943 cannot be used. This is worth doing on systems that have "holes" in
2944 address space, so sbrk cannot extend to give contiguous space, but
2945 space is available elsewhere. Note that we ignore mmap max count
2946 and threshold limits, since the space will not be used as a
2947 segregated mmap region.
2950 #if HAVE_MMAP
2951 /* Cannot merge with old top, so add its size back in */
2952 if (contiguous(av))
2953 size = (size + old_size + pagemask) & ~pagemask;
2955 /* If we are relying on mmap as backup, then use larger units */
2956 if ((unsigned long)(size) < (unsigned long)(MMAP_AS_MORECORE_SIZE))
2957 size = MMAP_AS_MORECORE_SIZE;
2959 /* Don't try if size wraps around 0 */
2960 if ((unsigned long)(size) > (unsigned long)(nb)) {
2962 char *mbrk = (char*)(MMAP(0, size, PROT_READ|PROT_WRITE, MAP_PRIVATE));
2964 if (mbrk != MAP_FAILED) {
2966 /* We do not need, and cannot use, another sbrk call to find end */
2967 brk = mbrk;
2968 snd_brk = brk + size;
2971 Record that we no longer have a contiguous sbrk region.
2972 After the first time mmap is used as backup, we do not
2973 ever rely on contiguous space since this could incorrectly
2974 bridge regions.
2976 set_noncontiguous(av);
2979 #endif
2982 if (brk != (char*)(MORECORE_FAILURE)) {
2983 if (mp_.sbrk_base == 0)
2984 mp_.sbrk_base = brk;
2985 av->system_mem += size;
2988 If MORECORE extends previous space, we can likewise extend top size.
2991 if (brk == old_end && snd_brk == (char*)(MORECORE_FAILURE))
2992 set_head(old_top, (size + old_size) | PREV_INUSE);
2994 else if (contiguous(av) && old_size && brk < old_end) {
2995 /* Oops! Someone else killed our space.. Can't touch anything. */
2996 assert(0);
3000 Otherwise, make adjustments:
3002 * If the first time through or noncontiguous, we need to call sbrk
3003 just to find out where the end of memory lies.
3005 * We need to ensure that all returned chunks from malloc will meet
3006 MALLOC_ALIGNMENT
3008 * If there was an intervening foreign sbrk, we need to adjust sbrk
3009 request size to account for fact that we will not be able to
3010 combine new space with existing space in old_top.
3012 * Almost all systems internally allocate whole pages at a time, in
3013 which case we might as well use the whole last page of request.
3014 So we allocate enough more memory to hit a page boundary now,
3015 which in turn causes future contiguous calls to page-align.
3018 else {
3019 front_misalign = 0;
3020 end_misalign = 0;
3021 correction = 0;
3022 aligned_brk = brk;
3024 /* handle contiguous cases */
3025 if (contiguous(av)) {
3027 /* Count foreign sbrk as system_mem. */
3028 if (old_size)
3029 av->system_mem += brk - old_end;
3031 /* Guarantee alignment of first new chunk made from this space */
3033 front_misalign = (INTERNAL_SIZE_T)chunk2mem(brk) & MALLOC_ALIGN_MASK;
3034 if (front_misalign > 0) {
3037 Skip over some bytes to arrive at an aligned position.
3038 We don't need to specially mark these wasted front bytes.
3039 They will never be accessed anyway because
3040 prev_inuse of av->top (and any chunk created from its start)
3041 is always true after initialization.
3044 correction = MALLOC_ALIGNMENT - front_misalign;
3045 aligned_brk += correction;
3049 If this isn't adjacent to existing space, then we will not
3050 be able to merge with old_top space, so must add to 2nd request.
3053 correction += old_size;
3055 /* Extend the end address to hit a page boundary */
3056 end_misalign = (INTERNAL_SIZE_T)(brk + size + correction);
3057 correction += ((end_misalign + pagemask) & ~pagemask) - end_misalign;
3059 assert(correction >= 0);
3060 snd_brk = (char*)(MORECORE(correction));
3063 If can't allocate correction, try to at least find out current
3064 brk. It might be enough to proceed without failing.
3066 Note that if second sbrk did NOT fail, we assume that space
3067 is contiguous with first sbrk. This is a safe assumption unless
3068 program is multithreaded but doesn't use locks and a foreign sbrk
3069 occurred between our first and second calls.
3072 if (snd_brk == (char*)(MORECORE_FAILURE)) {
3073 correction = 0;
3074 snd_brk = (char*)(MORECORE(0));
3075 } else
3076 /* Call the `morecore' hook if necessary. */
3077 if (__after_morecore_hook)
3078 (*__after_morecore_hook) ();
3081 /* handle non-contiguous cases */
3082 else {
3083 /* MORECORE/mmap must correctly align */
3084 assert(((unsigned long)chunk2mem(brk) & MALLOC_ALIGN_MASK) == 0);
3086 /* Find out current end of memory */
3087 if (snd_brk == (char*)(MORECORE_FAILURE)) {
3088 snd_brk = (char*)(MORECORE(0));
3092 /* Adjust top based on results of second sbrk */
3093 if (snd_brk != (char*)(MORECORE_FAILURE)) {
3094 av->top = (mchunkptr)aligned_brk;
3095 set_head(av->top, (snd_brk - aligned_brk + correction) | PREV_INUSE);
3096 av->system_mem += correction;
3099 If not the first time through, we either have a
3100 gap due to foreign sbrk or a non-contiguous region. Insert a
3101 double fencepost at old_top to prevent consolidation with space
3102 we don't own. These fenceposts are artificial chunks that are
3103 marked as inuse and are in any case too small to use. We need
3104 two to make sizes and alignments work out.
3107 if (old_size != 0) {
3109 Shrink old_top to insert fenceposts, keeping size a
3110 multiple of MALLOC_ALIGNMENT. We know there is at least
3111 enough space in old_top to do this.
3113 old_size = (old_size - 4*SIZE_SZ) & ~MALLOC_ALIGN_MASK;
3114 set_head(old_top, old_size | PREV_INUSE);
3117 Note that the following assignments completely overwrite
3118 old_top when old_size was previously MINSIZE. This is
3119 intentional. We need the fencepost, even if old_top otherwise gets
3120 lost.
3122 chunk_at_offset(old_top, old_size )->size =
3123 (2*SIZE_SZ)|PREV_INUSE;
3125 chunk_at_offset(old_top, old_size + 2*SIZE_SZ)->size =
3126 (2*SIZE_SZ)|PREV_INUSE;
3128 /* If possible, release the rest. */
3129 if (old_size >= MINSIZE) {
3130 _int_free(av, chunk2mem(old_top));
3137 /* Update statistics */
3138 #ifdef NO_THREADS
3139 sum = av->system_mem + mp_.mmapped_mem;
3140 if (sum > (unsigned long)(mp_.max_total_mem))
3141 mp_.max_total_mem = sum;
3142 #endif
3146 } /* if (av != &main_arena) */
3148 if ((unsigned long)av->system_mem > (unsigned long)(av->max_system_mem))
3149 av->max_system_mem = av->system_mem;
3150 check_malloc_state(av);
3152 /* finally, do the allocation */
3153 p = av->top;
3154 size = chunksize(p);
3156 /* check that one of the above allocation paths succeeded */
3157 if ((unsigned long)(size) >= (unsigned long)(nb + MINSIZE)) {
3158 remainder_size = size - nb;
3159 remainder = chunk_at_offset(p, nb);
3160 av->top = remainder;
3161 set_head(p, nb | PREV_INUSE | (av != &main_arena ? NON_MAIN_ARENA : 0));
3162 set_head(remainder, remainder_size | PREV_INUSE);
3163 check_malloced_chunk(av, p, nb);
3164 return chunk2mem(p);
3167 /* catch all failure paths */
3168 MALLOC_FAILURE_ACTION;
3169 return 0;
3174 sYSTRIm is an inverse of sorts to sYSMALLOc. It gives memory back
3175 to the system (via negative arguments to sbrk) if there is unused
3176 memory at the `high' end of the malloc pool. It is called
3177 automatically by free() when top space exceeds the trim
3178 threshold. It is also called by the public malloc_trim routine. It
3179 returns 1 if it actually released any memory, else 0.
3182 #if __STD_C
3183 static int sYSTRIm(size_t pad, mstate av)
3184 #else
3185 static int sYSTRIm(pad, av) size_t pad; mstate av;
3186 #endif
3188 long top_size; /* Amount of top-most memory */
3189 long extra; /* Amount to release */
3190 long released; /* Amount actually released */
3191 char* current_brk; /* address returned by pre-check sbrk call */
3192 char* new_brk; /* address returned by post-check sbrk call */
3193 size_t pagesz;
3195 pagesz = mp_.pagesize;
3196 top_size = chunksize(av->top);
3198 /* Release in pagesize units, keeping at least one page */
3199 extra = ((top_size - pad - MINSIZE + (pagesz-1)) / pagesz - 1) * pagesz;
3201 if (extra > 0) {
3204 Only proceed if end of memory is where we last set it.
3205 This avoids problems if there were foreign sbrk calls.
3207 current_brk = (char*)(MORECORE(0));
3208 if (current_brk == (char*)(av->top) + top_size) {
3211 Attempt to release memory. We ignore MORECORE return value,
3212 and instead call again to find out where new end of memory is.
3213 This avoids problems if first call releases less than we asked,
3214 of if failure somehow altered brk value. (We could still
3215 encounter problems if it altered brk in some very bad way,
3216 but the only thing we can do is adjust anyway, which will cause
3217 some downstream failure.)
3220 MORECORE(-extra);
3221 /* Call the `morecore' hook if necessary. */
3222 if (__after_morecore_hook)
3223 (*__after_morecore_hook) ();
3224 new_brk = (char*)(MORECORE(0));
3226 if (new_brk != (char*)MORECORE_FAILURE) {
3227 released = (long)(current_brk - new_brk);
3229 if (released != 0) {
3230 /* Success. Adjust top. */
3231 av->system_mem -= released;
3232 set_head(av->top, (top_size - released) | PREV_INUSE);
3233 check_malloc_state(av);
3234 return 1;
3239 return 0;
3242 #ifdef HAVE_MMAP
3244 static void
3245 internal_function
3246 #if __STD_C
3247 munmap_chunk(mchunkptr p)
3248 #else
3249 munmap_chunk(p) mchunkptr p;
3250 #endif
3252 INTERNAL_SIZE_T size = chunksize(p);
3253 int ret;
3255 assert (chunk_is_mmapped(p));
3256 #if 0
3257 assert(! ((char*)p >= mp_.sbrk_base && (char*)p < mp_.sbrk_base + mp_.sbrked_mem));
3258 assert((mp_.n_mmaps > 0));
3259 #endif
3260 assert(((p->prev_size + size) & (mp_.pagesize-1)) == 0);
3262 mp_.n_mmaps--;
3263 mp_.mmapped_mem -= (size + p->prev_size);
3265 ret = munmap((char *)p - p->prev_size, size + p->prev_size);
3267 /* munmap returns non-zero on failure */
3268 assert(ret == 0);
3271 #if HAVE_MREMAP
3273 static mchunkptr
3274 internal_function
3275 #if __STD_C
3276 mremap_chunk(mchunkptr p, size_t new_size)
3277 #else
3278 mremap_chunk(p, new_size) mchunkptr p; size_t new_size;
3279 #endif
3281 size_t page_mask = mp_.pagesize - 1;
3282 INTERNAL_SIZE_T offset = p->prev_size;
3283 INTERNAL_SIZE_T size = chunksize(p);
3284 char *cp;
3286 assert (chunk_is_mmapped(p));
3287 #if 0
3288 assert(! ((char*)p >= mp_.sbrk_base && (char*)p < mp_.sbrk_base + mp_.sbrked_mem));
3289 assert((mp_.n_mmaps > 0));
3290 #endif
3291 assert(((size + offset) & (mp_.pagesize-1)) == 0);
3293 /* Note the extra SIZE_SZ overhead as in mmap_chunk(). */
3294 new_size = (new_size + offset + SIZE_SZ + page_mask) & ~page_mask;
3296 cp = (char *)mremap((char *)p - offset, size + offset, new_size,
3297 MREMAP_MAYMOVE);
3299 if (cp == MAP_FAILED) return 0;
3301 p = (mchunkptr)(cp + offset);
3303 assert(aligned_OK(chunk2mem(p)));
3305 assert((p->prev_size == offset));
3306 set_head(p, (new_size - offset)|IS_MMAPPED);
3308 mp_.mmapped_mem -= size + offset;
3309 mp_.mmapped_mem += new_size;
3310 if ((unsigned long)mp_.mmapped_mem > (unsigned long)mp_.max_mmapped_mem)
3311 mp_.max_mmapped_mem = mp_.mmapped_mem;
3312 #ifdef NO_THREADS
3313 if ((unsigned long)(mp_.mmapped_mem + arena_mem + main_arena.system_mem) >
3314 mp_.max_total_mem)
3315 mp_.max_total_mem = mp_.mmapped_mem + arena_mem + main_arena.system_mem;
3316 #endif
3317 return p;
3320 #endif /* HAVE_MREMAP */
3322 #endif /* HAVE_MMAP */
3324 /*------------------------ Public wrappers. --------------------------------*/
3326 Void_t*
3327 public_mALLOc(size_t bytes)
3329 mstate ar_ptr;
3330 Void_t *victim;
3332 __malloc_ptr_t (*hook) (size_t, __const __malloc_ptr_t) = __malloc_hook;
3333 if (hook != NULL)
3334 return (*hook)(bytes, RETURN_ADDRESS (0));
3336 arena_get(ar_ptr, bytes);
3337 if(!ar_ptr)
3338 return 0;
3339 victim = _int_malloc(ar_ptr, bytes);
3340 if(!victim) {
3341 /* Maybe the failure is due to running out of mmapped areas. */
3342 if(ar_ptr != &main_arena) {
3343 (void)mutex_unlock(&ar_ptr->mutex);
3344 (void)mutex_lock(&main_arena.mutex);
3345 victim = _int_malloc(&main_arena, bytes);
3346 (void)mutex_unlock(&main_arena.mutex);
3347 } else {
3348 #if USE_ARENAS
3349 /* ... or sbrk() has failed and there is still a chance to mmap() */
3350 ar_ptr = arena_get2(ar_ptr->next ? ar_ptr : 0, bytes);
3351 (void)mutex_unlock(&main_arena.mutex);
3352 if(ar_ptr) {
3353 victim = _int_malloc(ar_ptr, bytes);
3354 (void)mutex_unlock(&ar_ptr->mutex);
3356 #endif
3358 } else
3359 (void)mutex_unlock(&ar_ptr->mutex);
3360 assert(!victim || chunk_is_mmapped(mem2chunk(victim)) ||
3361 ar_ptr == arena_for_chunk(mem2chunk(victim)));
3362 return victim;
3364 #ifdef libc_hidden_def
3365 libc_hidden_def(public_mALLOc)
3366 #endif
3368 void
3369 public_fREe(Void_t* mem)
3371 mstate ar_ptr;
3372 mchunkptr p; /* chunk corresponding to mem */
3374 void (*hook) (__malloc_ptr_t, __const __malloc_ptr_t) = __free_hook;
3375 if (hook != NULL) {
3376 (*hook)(mem, RETURN_ADDRESS (0));
3377 return;
3380 if (mem == 0) /* free(0) has no effect */
3381 return;
3383 p = mem2chunk(mem);
3385 #if HAVE_MMAP
3386 if (chunk_is_mmapped(p)) /* release mmapped memory. */
3388 munmap_chunk(p);
3389 return;
3391 #endif
3393 ar_ptr = arena_for_chunk(p);
3394 #if THREAD_STATS
3395 if(!mutex_trylock(&ar_ptr->mutex))
3396 ++(ar_ptr->stat_lock_direct);
3397 else {
3398 (void)mutex_lock(&ar_ptr->mutex);
3399 ++(ar_ptr->stat_lock_wait);
3401 #else
3402 (void)mutex_lock(&ar_ptr->mutex);
3403 #endif
3404 _int_free(ar_ptr, mem);
3405 (void)mutex_unlock(&ar_ptr->mutex);
3407 #ifdef libc_hidden_def
3408 libc_hidden_def (public_fREe)
3409 #endif
3411 Void_t*
3412 public_rEALLOc(Void_t* oldmem, size_t bytes)
3414 mstate ar_ptr;
3415 INTERNAL_SIZE_T nb; /* padded request size */
3417 mchunkptr oldp; /* chunk corresponding to oldmem */
3418 INTERNAL_SIZE_T oldsize; /* its size */
3420 Void_t* newp; /* chunk to return */
3422 __malloc_ptr_t (*hook) (__malloc_ptr_t, size_t, __const __malloc_ptr_t) =
3423 __realloc_hook;
3424 if (hook != NULL)
3425 return (*hook)(oldmem, bytes, RETURN_ADDRESS (0));
3427 #if REALLOC_ZERO_BYTES_FREES
3428 if (bytes == 0 && oldmem != NULL) { public_fREe(oldmem); return 0; }
3429 #endif
3431 /* realloc of null is supposed to be same as malloc */
3432 if (oldmem == 0) return public_mALLOc(bytes);
3434 oldp = mem2chunk(oldmem);
3435 oldsize = chunksize(oldp);
3437 /* Little security check which won't hurt performance: the
3438 allocator never wrapps around at the end of the address space.
3439 Therefore we can exclude some size values which might appear
3440 here by accident or by "design" from some intruder. */
3441 if (__builtin_expect ((uintptr_t) oldp > (uintptr_t) -oldsize, 0)
3442 || __builtin_expect ((uintptr_t) oldp & MALLOC_ALIGN_MASK, 0))
3444 malloc_printerr (check_action, "realloc(): invalid pointer", oldmem);
3445 return NULL;
3448 checked_request2size(bytes, nb);
3450 #if HAVE_MMAP
3451 if (chunk_is_mmapped(oldp))
3453 Void_t* newmem;
3455 #if HAVE_MREMAP
3456 newp = mremap_chunk(oldp, nb);
3457 if(newp) return chunk2mem(newp);
3458 #endif
3459 /* Note the extra SIZE_SZ overhead. */
3460 if(oldsize - SIZE_SZ >= nb) return oldmem; /* do nothing */
3461 /* Must alloc, copy, free. */
3462 newmem = public_mALLOc(bytes);
3463 if (newmem == 0) return 0; /* propagate failure */
3464 MALLOC_COPY(newmem, oldmem, oldsize - 2*SIZE_SZ);
3465 munmap_chunk(oldp);
3466 return newmem;
3468 #endif
3470 ar_ptr = arena_for_chunk(oldp);
3471 #if THREAD_STATS
3472 if(!mutex_trylock(&ar_ptr->mutex))
3473 ++(ar_ptr->stat_lock_direct);
3474 else {
3475 (void)mutex_lock(&ar_ptr->mutex);
3476 ++(ar_ptr->stat_lock_wait);
3478 #else
3479 (void)mutex_lock(&ar_ptr->mutex);
3480 #endif
3482 #ifndef NO_THREADS
3483 /* As in malloc(), remember this arena for the next allocation. */
3484 tsd_setspecific(arena_key, (Void_t *)ar_ptr);
3485 #endif
3487 newp = _int_realloc(ar_ptr, oldmem, bytes);
3489 (void)mutex_unlock(&ar_ptr->mutex);
3490 assert(!newp || chunk_is_mmapped(mem2chunk(newp)) ||
3491 ar_ptr == arena_for_chunk(mem2chunk(newp)));
3492 return newp;
3494 #ifdef libc_hidden_def
3495 libc_hidden_def (public_rEALLOc)
3496 #endif
3498 Void_t*
3499 public_mEMALIGn(size_t alignment, size_t bytes)
3501 mstate ar_ptr;
3502 Void_t *p;
3504 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3505 __const __malloc_ptr_t)) =
3506 __memalign_hook;
3507 if (hook != NULL)
3508 return (*hook)(alignment, bytes, RETURN_ADDRESS (0));
3510 /* If need less alignment than we give anyway, just relay to malloc */
3511 if (alignment <= MALLOC_ALIGNMENT) return public_mALLOc(bytes);
3513 /* Otherwise, ensure that it is at least a minimum chunk size */
3514 if (alignment < MINSIZE) alignment = MINSIZE;
3516 arena_get(ar_ptr, bytes + alignment + MINSIZE);
3517 if(!ar_ptr)
3518 return 0;
3519 p = _int_memalign(ar_ptr, alignment, bytes);
3520 (void)mutex_unlock(&ar_ptr->mutex);
3521 if(!p) {
3522 /* Maybe the failure is due to running out of mmapped areas. */
3523 if(ar_ptr != &main_arena) {
3524 (void)mutex_lock(&main_arena.mutex);
3525 p = _int_memalign(&main_arena, alignment, bytes);
3526 (void)mutex_unlock(&main_arena.mutex);
3527 } else {
3528 #if USE_ARENAS
3529 /* ... or sbrk() has failed and there is still a chance to mmap() */
3530 ar_ptr = arena_get2(ar_ptr->next ? ar_ptr : 0, bytes);
3531 if(ar_ptr) {
3532 p = _int_memalign(ar_ptr, alignment, bytes);
3533 (void)mutex_unlock(&ar_ptr->mutex);
3535 #endif
3538 assert(!p || chunk_is_mmapped(mem2chunk(p)) ||
3539 ar_ptr == arena_for_chunk(mem2chunk(p)));
3540 return p;
3542 #ifdef libc_hidden_def
3543 libc_hidden_def (public_mEMALIGn)
3544 #endif
3546 Void_t*
3547 public_vALLOc(size_t bytes)
3549 mstate ar_ptr;
3550 Void_t *p;
3552 if(__malloc_initialized < 0)
3553 ptmalloc_init ();
3555 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3556 __const __malloc_ptr_t)) =
3557 __memalign_hook;
3558 if (hook != NULL)
3559 return (*hook)(mp_.pagesize, bytes, RETURN_ADDRESS (0));
3561 arena_get(ar_ptr, bytes + mp_.pagesize + MINSIZE);
3562 if(!ar_ptr)
3563 return 0;
3564 p = _int_valloc(ar_ptr, bytes);
3565 (void)mutex_unlock(&ar_ptr->mutex);
3566 return p;
3569 Void_t*
3570 public_pVALLOc(size_t bytes)
3572 mstate ar_ptr;
3573 Void_t *p;
3575 if(__malloc_initialized < 0)
3576 ptmalloc_init ();
3578 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3579 __const __malloc_ptr_t)) =
3580 __memalign_hook;
3581 if (hook != NULL)
3582 return (*hook)(mp_.pagesize,
3583 (bytes + mp_.pagesize - 1) & ~(mp_.pagesize - 1),
3584 RETURN_ADDRESS (0));
3586 arena_get(ar_ptr, bytes + 2*mp_.pagesize + MINSIZE);
3587 p = _int_pvalloc(ar_ptr, bytes);
3588 (void)mutex_unlock(&ar_ptr->mutex);
3589 return p;
3592 Void_t*
3593 public_cALLOc(size_t n, size_t elem_size)
3595 mstate av;
3596 mchunkptr oldtop, p;
3597 INTERNAL_SIZE_T bytes, sz, csz, oldtopsize;
3598 Void_t* mem;
3599 unsigned long clearsize;
3600 unsigned long nclears;
3601 INTERNAL_SIZE_T* d;
3602 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, __const __malloc_ptr_t)) =
3603 __malloc_hook;
3605 /* size_t is unsigned so the behavior on overflow is defined. */
3606 bytes = n * elem_size;
3607 #define HALF_INTERNAL_SIZE_T \
3608 (((INTERNAL_SIZE_T) 1) << (8 * sizeof (INTERNAL_SIZE_T) / 2))
3609 if (__builtin_expect ((n | elem_size) >= HALF_INTERNAL_SIZE_T, 0)) {
3610 if (elem_size != 0 && bytes / elem_size != n) {
3611 MALLOC_FAILURE_ACTION;
3612 return 0;
3616 if (hook != NULL) {
3617 sz = bytes;
3618 mem = (*hook)(sz, RETURN_ADDRESS (0));
3619 if(mem == 0)
3620 return 0;
3621 #ifdef HAVE_MEMCPY
3622 return memset(mem, 0, sz);
3623 #else
3624 while(sz > 0) ((char*)mem)[--sz] = 0; /* rather inefficient */
3625 return mem;
3626 #endif
3629 sz = bytes;
3631 arena_get(av, sz);
3632 if(!av)
3633 return 0;
3635 /* Check if we hand out the top chunk, in which case there may be no
3636 need to clear. */
3637 #if MORECORE_CLEARS
3638 oldtop = top(av);
3639 oldtopsize = chunksize(top(av));
3640 #if MORECORE_CLEARS < 2
3641 /* Only newly allocated memory is guaranteed to be cleared. */
3642 if (av == &main_arena &&
3643 oldtopsize < mp_.sbrk_base + av->max_system_mem - (char *)oldtop)
3644 oldtopsize = (mp_.sbrk_base + av->max_system_mem - (char *)oldtop);
3645 #endif
3646 #endif
3647 mem = _int_malloc(av, sz);
3649 /* Only clearing follows, so we can unlock early. */
3650 (void)mutex_unlock(&av->mutex);
3652 assert(!mem || chunk_is_mmapped(mem2chunk(mem)) ||
3653 av == arena_for_chunk(mem2chunk(mem)));
3655 if (mem == 0) {
3656 /* Maybe the failure is due to running out of mmapped areas. */
3657 if(av != &main_arena) {
3658 (void)mutex_lock(&main_arena.mutex);
3659 mem = _int_malloc(&main_arena, sz);
3660 (void)mutex_unlock(&main_arena.mutex);
3661 } else {
3662 #if USE_ARENAS
3663 /* ... or sbrk() has failed and there is still a chance to mmap() */
3664 (void)mutex_lock(&main_arena.mutex);
3665 av = arena_get2(av->next ? av : 0, sz);
3666 (void)mutex_unlock(&main_arena.mutex);
3667 if(av) {
3668 mem = _int_malloc(av, sz);
3669 (void)mutex_unlock(&av->mutex);
3671 #endif
3673 if (mem == 0) return 0;
3675 p = mem2chunk(mem);
3677 /* Two optional cases in which clearing not necessary */
3678 #if HAVE_MMAP
3679 if (chunk_is_mmapped(p))
3680 return mem;
3681 #endif
3683 csz = chunksize(p);
3685 #if MORECORE_CLEARS
3686 if (p == oldtop && csz > oldtopsize) {
3687 /* clear only the bytes from non-freshly-sbrked memory */
3688 csz = oldtopsize;
3690 #endif
3692 /* Unroll clear of <= 36 bytes (72 if 8byte sizes). We know that
3693 contents have an odd number of INTERNAL_SIZE_T-sized words;
3694 minimally 3. */
3695 d = (INTERNAL_SIZE_T*)mem;
3696 clearsize = csz - SIZE_SZ;
3697 nclears = clearsize / sizeof(INTERNAL_SIZE_T);
3698 assert(nclears >= 3);
3700 if (nclears > 9)
3701 MALLOC_ZERO(d, clearsize);
3703 else {
3704 *(d+0) = 0;
3705 *(d+1) = 0;
3706 *(d+2) = 0;
3707 if (nclears > 4) {
3708 *(d+3) = 0;
3709 *(d+4) = 0;
3710 if (nclears > 6) {
3711 *(d+5) = 0;
3712 *(d+6) = 0;
3713 if (nclears > 8) {
3714 *(d+7) = 0;
3715 *(d+8) = 0;
3721 return mem;
3724 Void_t**
3725 public_iCALLOc(size_t n, size_t elem_size, Void_t** chunks)
3727 mstate ar_ptr;
3728 Void_t** m;
3730 arena_get(ar_ptr, n*elem_size);
3731 if(!ar_ptr)
3732 return 0;
3734 m = _int_icalloc(ar_ptr, n, elem_size, chunks);
3735 (void)mutex_unlock(&ar_ptr->mutex);
3736 return m;
3739 Void_t**
3740 public_iCOMALLOc(size_t n, size_t sizes[], Void_t** chunks)
3742 mstate ar_ptr;
3743 Void_t** m;
3745 arena_get(ar_ptr, 0);
3746 if(!ar_ptr)
3747 return 0;
3749 m = _int_icomalloc(ar_ptr, n, sizes, chunks);
3750 (void)mutex_unlock(&ar_ptr->mutex);
3751 return m;
3754 #ifndef _LIBC
3756 void
3757 public_cFREe(Void_t* m)
3759 public_fREe(m);
3762 #endif /* _LIBC */
3765 public_mTRIm(size_t s)
3767 int result;
3769 (void)mutex_lock(&main_arena.mutex);
3770 result = mTRIm(s);
3771 (void)mutex_unlock(&main_arena.mutex);
3772 return result;
3775 size_t
3776 public_mUSABLe(Void_t* m)
3778 size_t result;
3780 result = mUSABLe(m);
3781 return result;
3784 void
3785 public_mSTATs()
3787 mSTATs();
3790 struct mallinfo public_mALLINFo()
3792 struct mallinfo m;
3794 if(__malloc_initialized < 0)
3795 ptmalloc_init ();
3796 (void)mutex_lock(&main_arena.mutex);
3797 m = mALLINFo(&main_arena);
3798 (void)mutex_unlock(&main_arena.mutex);
3799 return m;
3803 public_mALLOPt(int p, int v)
3805 int result;
3806 result = mALLOPt(p, v);
3807 return result;
3811 ------------------------------ malloc ------------------------------
3814 Void_t*
3815 _int_malloc(mstate av, size_t bytes)
3817 INTERNAL_SIZE_T nb; /* normalized request size */
3818 unsigned int idx; /* associated bin index */
3819 mbinptr bin; /* associated bin */
3820 mfastbinptr* fb; /* associated fastbin */
3822 mchunkptr victim; /* inspected/selected chunk */
3823 INTERNAL_SIZE_T size; /* its size */
3824 int victim_index; /* its bin index */
3826 mchunkptr remainder; /* remainder from a split */
3827 unsigned long remainder_size; /* its size */
3829 unsigned int block; /* bit map traverser */
3830 unsigned int bit; /* bit map traverser */
3831 unsigned int map; /* current word of binmap */
3833 mchunkptr fwd; /* misc temp for linking */
3834 mchunkptr bck; /* misc temp for linking */
3837 Convert request size to internal form by adding SIZE_SZ bytes
3838 overhead plus possibly more to obtain necessary alignment and/or
3839 to obtain a size of at least MINSIZE, the smallest allocatable
3840 size. Also, checked_request2size traps (returning 0) request sizes
3841 that are so large that they wrap around zero when padded and
3842 aligned.
3845 checked_request2size(bytes, nb);
3848 If the size qualifies as a fastbin, first check corresponding bin.
3849 This code is safe to execute even if av is not yet initialized, so we
3850 can try it without checking, which saves some time on this fast path.
3853 if ((unsigned long)(nb) <= (unsigned long)(av->max_fast)) {
3854 long int idx = fastbin_index(nb);
3855 fb = &(av->fastbins[idx]);
3856 if ( (victim = *fb) != 0) {
3857 if (__builtin_expect (fastbin_index (chunksize (victim)) != idx, 0))
3858 malloc_printerr (check_action, "malloc(): memory corruption (fast)",
3859 chunk2mem (victim));
3860 *fb = victim->fd;
3861 check_remalloced_chunk(av, victim, nb);
3862 return chunk2mem(victim);
3867 If a small request, check regular bin. Since these "smallbins"
3868 hold one size each, no searching within bins is necessary.
3869 (For a large request, we need to wait until unsorted chunks are
3870 processed to find best fit. But for small ones, fits are exact
3871 anyway, so we can check now, which is faster.)
3874 if (in_smallbin_range(nb)) {
3875 idx = smallbin_index(nb);
3876 bin = bin_at(av,idx);
3878 if ( (victim = last(bin)) != bin) {
3879 if (victim == 0) /* initialization check */
3880 malloc_consolidate(av);
3881 else {
3882 bck = victim->bk;
3883 set_inuse_bit_at_offset(victim, nb);
3884 bin->bk = bck;
3885 bck->fd = bin;
3887 if (av != &main_arena)
3888 victim->size |= NON_MAIN_ARENA;
3889 check_malloced_chunk(av, victim, nb);
3890 return chunk2mem(victim);
3896 If this is a large request, consolidate fastbins before continuing.
3897 While it might look excessive to kill all fastbins before
3898 even seeing if there is space available, this avoids
3899 fragmentation problems normally associated with fastbins.
3900 Also, in practice, programs tend to have runs of either small or
3901 large requests, but less often mixtures, so consolidation is not
3902 invoked all that often in most programs. And the programs that
3903 it is called frequently in otherwise tend to fragment.
3906 else {
3907 idx = largebin_index(nb);
3908 if (have_fastchunks(av))
3909 malloc_consolidate(av);
3913 Process recently freed or remaindered chunks, taking one only if
3914 it is exact fit, or, if this a small request, the chunk is remainder from
3915 the most recent non-exact fit. Place other traversed chunks in
3916 bins. Note that this step is the only place in any routine where
3917 chunks are placed in bins.
3919 The outer loop here is needed because we might not realize until
3920 near the end of malloc that we should have consolidated, so must
3921 do so and retry. This happens at most once, and only when we would
3922 otherwise need to expand memory to service a "small" request.
3925 for(;;) {
3927 while ( (victim = unsorted_chunks(av)->bk) != unsorted_chunks(av)) {
3928 bck = victim->bk;
3929 if (__builtin_expect (victim->size <= 2 * SIZE_SZ, 0)
3930 || __builtin_expect (victim->size > av->system_mem, 0))
3931 malloc_printerr (check_action, "malloc(): memory corruption",
3932 chunk2mem (victim));
3933 size = chunksize(victim);
3936 If a small request, try to use last remainder if it is the
3937 only chunk in unsorted bin. This helps promote locality for
3938 runs of consecutive small requests. This is the only
3939 exception to best-fit, and applies only when there is
3940 no exact fit for a small chunk.
3943 if (in_smallbin_range(nb) &&
3944 bck == unsorted_chunks(av) &&
3945 victim == av->last_remainder &&
3946 (unsigned long)(size) > (unsigned long)(nb + MINSIZE)) {
3948 /* split and reattach remainder */
3949 remainder_size = size - nb;
3950 remainder = chunk_at_offset(victim, nb);
3951 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
3952 av->last_remainder = remainder;
3953 remainder->bk = remainder->fd = unsorted_chunks(av);
3955 set_head(victim, nb | PREV_INUSE |
3956 (av != &main_arena ? NON_MAIN_ARENA : 0));
3957 set_head(remainder, remainder_size | PREV_INUSE);
3958 set_foot(remainder, remainder_size);
3960 check_malloced_chunk(av, victim, nb);
3961 return chunk2mem(victim);
3964 /* remove from unsorted list */
3965 unsorted_chunks(av)->bk = bck;
3966 bck->fd = unsorted_chunks(av);
3968 /* Take now instead of binning if exact fit */
3970 if (size == nb) {
3971 set_inuse_bit_at_offset(victim, size);
3972 if (av != &main_arena)
3973 victim->size |= NON_MAIN_ARENA;
3974 check_malloced_chunk(av, victim, nb);
3975 return chunk2mem(victim);
3978 /* place chunk in bin */
3980 if (in_smallbin_range(size)) {
3981 victim_index = smallbin_index(size);
3982 bck = bin_at(av, victim_index);
3983 fwd = bck->fd;
3985 else {
3986 victim_index = largebin_index(size);
3987 bck = bin_at(av, victim_index);
3988 fwd = bck->fd;
3990 /* maintain large bins in sorted order */
3991 if (fwd != bck) {
3992 /* Or with inuse bit to speed comparisons */
3993 size |= PREV_INUSE;
3994 /* if smaller than smallest, bypass loop below */
3995 assert((bck->bk->size & NON_MAIN_ARENA) == 0);
3996 if ((unsigned long)(size) <= (unsigned long)(bck->bk->size)) {
3997 fwd = bck;
3998 bck = bck->bk;
4000 else {
4001 assert((fwd->size & NON_MAIN_ARENA) == 0);
4002 while ((unsigned long)(size) < (unsigned long)(fwd->size)) {
4003 fwd = fwd->fd;
4004 assert((fwd->size & NON_MAIN_ARENA) == 0);
4006 bck = fwd->bk;
4011 mark_bin(av, victim_index);
4012 victim->bk = bck;
4013 victim->fd = fwd;
4014 fwd->bk = victim;
4015 bck->fd = victim;
4019 If a large request, scan through the chunks of current bin in
4020 sorted order to find smallest that fits. This is the only step
4021 where an unbounded number of chunks might be scanned without doing
4022 anything useful with them. However the lists tend to be short.
4025 if (!in_smallbin_range(nb)) {
4026 bin = bin_at(av, idx);
4028 /* skip scan if empty or largest chunk is too small */
4029 if ((victim = last(bin)) != bin &&
4030 (unsigned long)(first(bin)->size) >= (unsigned long)(nb)) {
4032 while (((unsigned long)(size = chunksize(victim)) <
4033 (unsigned long)(nb)))
4034 victim = victim->bk;
4036 remainder_size = size - nb;
4037 unlink(victim, bck, fwd);
4039 /* Exhaust */
4040 if (remainder_size < MINSIZE) {
4041 set_inuse_bit_at_offset(victim, size);
4042 if (av != &main_arena)
4043 victim->size |= NON_MAIN_ARENA;
4044 check_malloced_chunk(av, victim, nb);
4045 return chunk2mem(victim);
4047 /* Split */
4048 else {
4049 remainder = chunk_at_offset(victim, nb);
4050 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
4051 remainder->bk = remainder->fd = unsorted_chunks(av);
4052 set_head(victim, nb | PREV_INUSE |
4053 (av != &main_arena ? NON_MAIN_ARENA : 0));
4054 set_head(remainder, remainder_size | PREV_INUSE);
4055 set_foot(remainder, remainder_size);
4056 check_malloced_chunk(av, victim, nb);
4057 return chunk2mem(victim);
4063 Search for a chunk by scanning bins, starting with next largest
4064 bin. This search is strictly by best-fit; i.e., the smallest
4065 (with ties going to approximately the least recently used) chunk
4066 that fits is selected.
4068 The bitmap avoids needing to check that most blocks are nonempty.
4069 The particular case of skipping all bins during warm-up phases
4070 when no chunks have been returned yet is faster than it might look.
4073 ++idx;
4074 bin = bin_at(av,idx);
4075 block = idx2block(idx);
4076 map = av->binmap[block];
4077 bit = idx2bit(idx);
4079 for (;;) {
4081 /* Skip rest of block if there are no more set bits in this block. */
4082 if (bit > map || bit == 0) {
4083 do {
4084 if (++block >= BINMAPSIZE) /* out of bins */
4085 goto use_top;
4086 } while ( (map = av->binmap[block]) == 0);
4088 bin = bin_at(av, (block << BINMAPSHIFT));
4089 bit = 1;
4092 /* Advance to bin with set bit. There must be one. */
4093 while ((bit & map) == 0) {
4094 bin = next_bin(bin);
4095 bit <<= 1;
4096 assert(bit != 0);
4099 /* Inspect the bin. It is likely to be non-empty */
4100 victim = last(bin);
4102 /* If a false alarm (empty bin), clear the bit. */
4103 if (victim == bin) {
4104 av->binmap[block] = map &= ~bit; /* Write through */
4105 bin = next_bin(bin);
4106 bit <<= 1;
4109 else {
4110 size = chunksize(victim);
4112 /* We know the first chunk in this bin is big enough to use. */
4113 assert((unsigned long)(size) >= (unsigned long)(nb));
4115 remainder_size = size - nb;
4117 /* unlink */
4118 bck = victim->bk;
4119 bin->bk = bck;
4120 bck->fd = bin;
4122 /* Exhaust */
4123 if (remainder_size < MINSIZE) {
4124 set_inuse_bit_at_offset(victim, size);
4125 if (av != &main_arena)
4126 victim->size |= NON_MAIN_ARENA;
4127 check_malloced_chunk(av, victim, nb);
4128 return chunk2mem(victim);
4131 /* Split */
4132 else {
4133 remainder = chunk_at_offset(victim, nb);
4135 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
4136 remainder->bk = remainder->fd = unsorted_chunks(av);
4137 /* advertise as last remainder */
4138 if (in_smallbin_range(nb))
4139 av->last_remainder = remainder;
4141 set_head(victim, nb | PREV_INUSE |
4142 (av != &main_arena ? NON_MAIN_ARENA : 0));
4143 set_head(remainder, remainder_size | PREV_INUSE);
4144 set_foot(remainder, remainder_size);
4145 check_malloced_chunk(av, victim, nb);
4146 return chunk2mem(victim);
4151 use_top:
4153 If large enough, split off the chunk bordering the end of memory
4154 (held in av->top). Note that this is in accord with the best-fit
4155 search rule. In effect, av->top is treated as larger (and thus
4156 less well fitting) than any other available chunk since it can
4157 be extended to be as large as necessary (up to system
4158 limitations).
4160 We require that av->top always exists (i.e., has size >=
4161 MINSIZE) after initialization, so if it would otherwise be
4162 exhuasted by current request, it is replenished. (The main
4163 reason for ensuring it exists is that we may need MINSIZE space
4164 to put in fenceposts in sysmalloc.)
4167 victim = av->top;
4168 size = chunksize(victim);
4170 if ((unsigned long)(size) >= (unsigned long)(nb + MINSIZE)) {
4171 remainder_size = size - nb;
4172 remainder = chunk_at_offset(victim, nb);
4173 av->top = remainder;
4174 set_head(victim, nb | PREV_INUSE |
4175 (av != &main_arena ? NON_MAIN_ARENA : 0));
4176 set_head(remainder, remainder_size | PREV_INUSE);
4178 check_malloced_chunk(av, victim, nb);
4179 return chunk2mem(victim);
4183 If there is space available in fastbins, consolidate and retry,
4184 to possibly avoid expanding memory. This can occur only if nb is
4185 in smallbin range so we didn't consolidate upon entry.
4188 else if (have_fastchunks(av)) {
4189 assert(in_smallbin_range(nb));
4190 malloc_consolidate(av);
4191 idx = smallbin_index(nb); /* restore original bin index */
4195 Otherwise, relay to handle system-dependent cases
4197 else
4198 return sYSMALLOc(nb, av);
4203 ------------------------------ free ------------------------------
4206 void
4207 _int_free(mstate av, Void_t* mem)
4209 mchunkptr p; /* chunk corresponding to mem */
4210 INTERNAL_SIZE_T size; /* its size */
4211 mfastbinptr* fb; /* associated fastbin */
4212 mchunkptr nextchunk; /* next contiguous chunk */
4213 INTERNAL_SIZE_T nextsize; /* its size */
4214 int nextinuse; /* true if nextchunk is used */
4215 INTERNAL_SIZE_T prevsize; /* size of previous contiguous chunk */
4216 mchunkptr bck; /* misc temp for linking */
4217 mchunkptr fwd; /* misc temp for linking */
4219 const char *errstr = NULL;
4221 p = mem2chunk(mem);
4222 size = chunksize(p);
4224 /* Little security check which won't hurt performance: the
4225 allocator never wrapps around at the end of the address space.
4226 Therefore we can exclude some size values which might appear
4227 here by accident or by "design" from some intruder. */
4228 if (__builtin_expect ((uintptr_t) p > (uintptr_t) -size, 0)
4229 || __builtin_expect ((uintptr_t) p & MALLOC_ALIGN_MASK, 0))
4231 errstr = "free(): invalid pointer";
4232 errout:
4233 malloc_printerr (check_action, errstr, mem);
4234 return;
4237 check_inuse_chunk(av, p);
4240 If eligible, place chunk on a fastbin so it can be found
4241 and used quickly in malloc.
4244 if ((unsigned long)(size) <= (unsigned long)(av->max_fast)
4246 #if TRIM_FASTBINS
4248 If TRIM_FASTBINS set, don't place chunks
4249 bordering top into fastbins
4251 && (chunk_at_offset(p, size) != av->top)
4252 #endif
4255 if (__builtin_expect (chunk_at_offset (p, size)->size <= 2 * SIZE_SZ, 0)
4256 || __builtin_expect (chunksize (chunk_at_offset (p, size))
4257 >= av->system_mem, 0))
4259 errstr = "free(): invalid next size (fast)";
4260 goto errout;
4263 set_fastchunks(av);
4264 fb = &(av->fastbins[fastbin_index(size)]);
4265 /* Another simple check: make sure the top of the bin is not the
4266 record we are going to add (i.e., double free). */
4267 if (__builtin_expect (*fb == p, 0))
4269 errstr = "double free or corruption (fasttop)";
4270 goto errout;
4272 p->fd = *fb;
4273 *fb = p;
4277 Consolidate other non-mmapped chunks as they arrive.
4280 else if (!chunk_is_mmapped(p)) {
4281 nextchunk = chunk_at_offset(p, size);
4283 /* Lightweight tests: check whether the block is already the
4284 top block. */
4285 if (__builtin_expect (p == av->top, 0))
4287 errstr = "double free or corruption (top)";
4288 goto errout;
4290 /* Or whether the next chunk is beyond the boundaries of the arena. */
4291 if (__builtin_expect (contiguous (av)
4292 && (char *) nextchunk
4293 >= ((char *) av->top + chunksize(av->top)), 0))
4295 errstr = "double free or corruption (out)";
4296 goto errout;
4298 /* Or whether the block is actually not marked used. */
4299 if (__builtin_expect (!prev_inuse(nextchunk), 0))
4301 errstr = "double free or corruption (!prev)";
4302 goto errout;
4305 nextsize = chunksize(nextchunk);
4306 if (__builtin_expect (nextchunk->size <= 2 * SIZE_SZ, 0)
4307 || __builtin_expect (nextsize >= av->system_mem, 0))
4309 errstr = "free(): invalid next size (normal)";
4310 goto errout;
4313 /* consolidate backward */
4314 if (!prev_inuse(p)) {
4315 prevsize = p->prev_size;
4316 size += prevsize;
4317 p = chunk_at_offset(p, -((long) prevsize));
4318 unlink(p, bck, fwd);
4321 if (nextchunk != av->top) {
4322 /* get and clear inuse bit */
4323 nextinuse = inuse_bit_at_offset(nextchunk, nextsize);
4325 /* consolidate forward */
4326 if (!nextinuse) {
4327 unlink(nextchunk, bck, fwd);
4328 size += nextsize;
4329 } else
4330 clear_inuse_bit_at_offset(nextchunk, 0);
4333 Place the chunk in unsorted chunk list. Chunks are
4334 not placed into regular bins until after they have
4335 been given one chance to be used in malloc.
4338 bck = unsorted_chunks(av);
4339 fwd = bck->fd;
4340 p->bk = bck;
4341 p->fd = fwd;
4342 bck->fd = p;
4343 fwd->bk = p;
4345 set_head(p, size | PREV_INUSE);
4346 set_foot(p, size);
4348 check_free_chunk(av, p);
4352 If the chunk borders the current high end of memory,
4353 consolidate into top
4356 else {
4357 size += nextsize;
4358 set_head(p, size | PREV_INUSE);
4359 av->top = p;
4360 check_chunk(av, p);
4364 If freeing a large space, consolidate possibly-surrounding
4365 chunks. Then, if the total unused topmost memory exceeds trim
4366 threshold, ask malloc_trim to reduce top.
4368 Unless max_fast is 0, we don't know if there are fastbins
4369 bordering top, so we cannot tell for sure whether threshold
4370 has been reached unless fastbins are consolidated. But we
4371 don't want to consolidate on each free. As a compromise,
4372 consolidation is performed if FASTBIN_CONSOLIDATION_THRESHOLD
4373 is reached.
4376 if ((unsigned long)(size) >= FASTBIN_CONSOLIDATION_THRESHOLD) {
4377 if (have_fastchunks(av))
4378 malloc_consolidate(av);
4380 if (av == &main_arena) {
4381 #ifndef MORECORE_CANNOT_TRIM
4382 if ((unsigned long)(chunksize(av->top)) >=
4383 (unsigned long)(mp_.trim_threshold))
4384 sYSTRIm(mp_.top_pad, av);
4385 #endif
4386 } else {
4387 /* Always try heap_trim(), even if the top chunk is not
4388 large, because the corresponding heap might go away. */
4389 heap_info *heap = heap_for_ptr(top(av));
4391 assert(heap->ar_ptr == av);
4392 heap_trim(heap, mp_.top_pad);
4398 If the chunk was allocated via mmap, release via munmap(). Note
4399 that if HAVE_MMAP is false but chunk_is_mmapped is true, then
4400 user must have overwritten memory. There's nothing we can do to
4401 catch this error unless MALLOC_DEBUG is set, in which case
4402 check_inuse_chunk (above) will have triggered error.
4405 else {
4406 #if HAVE_MMAP
4407 munmap_chunk (p);
4408 #endif
4413 ------------------------- malloc_consolidate -------------------------
4415 malloc_consolidate is a specialized version of free() that tears
4416 down chunks held in fastbins. Free itself cannot be used for this
4417 purpose since, among other things, it might place chunks back onto
4418 fastbins. So, instead, we need to use a minor variant of the same
4419 code.
4421 Also, because this routine needs to be called the first time through
4422 malloc anyway, it turns out to be the perfect place to trigger
4423 initialization code.
4426 #if __STD_C
4427 static void malloc_consolidate(mstate av)
4428 #else
4429 static void malloc_consolidate(av) mstate av;
4430 #endif
4432 mfastbinptr* fb; /* current fastbin being consolidated */
4433 mfastbinptr* maxfb; /* last fastbin (for loop control) */
4434 mchunkptr p; /* current chunk being consolidated */
4435 mchunkptr nextp; /* next chunk to consolidate */
4436 mchunkptr unsorted_bin; /* bin header */
4437 mchunkptr first_unsorted; /* chunk to link to */
4439 /* These have same use as in free() */
4440 mchunkptr nextchunk;
4441 INTERNAL_SIZE_T size;
4442 INTERNAL_SIZE_T nextsize;
4443 INTERNAL_SIZE_T prevsize;
4444 int nextinuse;
4445 mchunkptr bck;
4446 mchunkptr fwd;
4449 If max_fast is 0, we know that av hasn't
4450 yet been initialized, in which case do so below
4453 if (av->max_fast != 0) {
4454 clear_fastchunks(av);
4456 unsorted_bin = unsorted_chunks(av);
4459 Remove each chunk from fast bin and consolidate it, placing it
4460 then in unsorted bin. Among other reasons for doing this,
4461 placing in unsorted bin avoids needing to calculate actual bins
4462 until malloc is sure that chunks aren't immediately going to be
4463 reused anyway.
4466 maxfb = &(av->fastbins[fastbin_index(av->max_fast)]);
4467 fb = &(av->fastbins[0]);
4468 do {
4469 if ( (p = *fb) != 0) {
4470 *fb = 0;
4472 do {
4473 check_inuse_chunk(av, p);
4474 nextp = p->fd;
4476 /* Slightly streamlined version of consolidation code in free() */
4477 size = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
4478 nextchunk = chunk_at_offset(p, size);
4479 nextsize = chunksize(nextchunk);
4481 if (!prev_inuse(p)) {
4482 prevsize = p->prev_size;
4483 size += prevsize;
4484 p = chunk_at_offset(p, -((long) prevsize));
4485 unlink(p, bck, fwd);
4488 if (nextchunk != av->top) {
4489 nextinuse = inuse_bit_at_offset(nextchunk, nextsize);
4491 if (!nextinuse) {
4492 size += nextsize;
4493 unlink(nextchunk, bck, fwd);
4494 } else
4495 clear_inuse_bit_at_offset(nextchunk, 0);
4497 first_unsorted = unsorted_bin->fd;
4498 unsorted_bin->fd = p;
4499 first_unsorted->bk = p;
4501 set_head(p, size | PREV_INUSE);
4502 p->bk = unsorted_bin;
4503 p->fd = first_unsorted;
4504 set_foot(p, size);
4507 else {
4508 size += nextsize;
4509 set_head(p, size | PREV_INUSE);
4510 av->top = p;
4513 } while ( (p = nextp) != 0);
4516 } while (fb++ != maxfb);
4518 else {
4519 malloc_init_state(av);
4520 check_malloc_state(av);
4525 ------------------------------ realloc ------------------------------
4528 Void_t*
4529 _int_realloc(mstate av, Void_t* oldmem, size_t bytes)
4531 INTERNAL_SIZE_T nb; /* padded request size */
4533 mchunkptr oldp; /* chunk corresponding to oldmem */
4534 INTERNAL_SIZE_T oldsize; /* its size */
4536 mchunkptr newp; /* chunk to return */
4537 INTERNAL_SIZE_T newsize; /* its size */
4538 Void_t* newmem; /* corresponding user mem */
4540 mchunkptr next; /* next contiguous chunk after oldp */
4542 mchunkptr remainder; /* extra space at end of newp */
4543 unsigned long remainder_size; /* its size */
4545 mchunkptr bck; /* misc temp for linking */
4546 mchunkptr fwd; /* misc temp for linking */
4548 unsigned long copysize; /* bytes to copy */
4549 unsigned int ncopies; /* INTERNAL_SIZE_T words to copy */
4550 INTERNAL_SIZE_T* s; /* copy source */
4551 INTERNAL_SIZE_T* d; /* copy destination */
4553 const char *errstr = NULL;
4556 checked_request2size(bytes, nb);
4558 oldp = mem2chunk(oldmem);
4559 oldsize = chunksize(oldp);
4561 /* Simple tests for old block integrity. */
4562 if (__builtin_expect ((uintptr_t) oldp & MALLOC_ALIGN_MASK, 0))
4564 errstr = "realloc(): invalid pointer";
4565 errout:
4566 malloc_printerr (check_action, errstr, oldmem);
4567 return NULL;
4569 if (__builtin_expect (oldp->size <= 2 * SIZE_SZ, 0)
4570 || __builtin_expect (oldsize >= av->system_mem, 0))
4572 errstr = "realloc(): invalid size";
4573 goto errout;
4576 check_inuse_chunk(av, oldp);
4578 if (!chunk_is_mmapped(oldp)) {
4580 next = chunk_at_offset(oldp, oldsize);
4581 INTERNAL_SIZE_T nextsize = chunksize(next);
4582 if (__builtin_expect (next->size <= 2 * SIZE_SZ, 0)
4583 || __builtin_expect (nextsize >= av->system_mem, 0))
4585 errstr = "realloc(): invalid next size";
4586 goto errout;
4589 if ((unsigned long)(oldsize) >= (unsigned long)(nb)) {
4590 /* already big enough; split below */
4591 newp = oldp;
4592 newsize = oldsize;
4595 else {
4596 /* Try to expand forward into top */
4597 if (next == av->top &&
4598 (unsigned long)(newsize = oldsize + nextsize) >=
4599 (unsigned long)(nb + MINSIZE)) {
4600 set_head_size(oldp, nb | (av != &main_arena ? NON_MAIN_ARENA : 0));
4601 av->top = chunk_at_offset(oldp, nb);
4602 set_head(av->top, (newsize - nb) | PREV_INUSE);
4603 check_inuse_chunk(av, oldp);
4604 return chunk2mem(oldp);
4607 /* Try to expand forward into next chunk; split off remainder below */
4608 else if (next != av->top &&
4609 !inuse(next) &&
4610 (unsigned long)(newsize = oldsize + nextsize) >=
4611 (unsigned long)(nb)) {
4612 newp = oldp;
4613 unlink(next, bck, fwd);
4616 /* allocate, copy, free */
4617 else {
4618 newmem = _int_malloc(av, nb - MALLOC_ALIGN_MASK);
4619 if (newmem == 0)
4620 return 0; /* propagate failure */
4622 newp = mem2chunk(newmem);
4623 newsize = chunksize(newp);
4626 Avoid copy if newp is next chunk after oldp.
4628 if (newp == next) {
4629 newsize += oldsize;
4630 newp = oldp;
4632 else {
4634 Unroll copy of <= 36 bytes (72 if 8byte sizes)
4635 We know that contents have an odd number of
4636 INTERNAL_SIZE_T-sized words; minimally 3.
4639 copysize = oldsize - SIZE_SZ;
4640 s = (INTERNAL_SIZE_T*)(oldmem);
4641 d = (INTERNAL_SIZE_T*)(newmem);
4642 ncopies = copysize / sizeof(INTERNAL_SIZE_T);
4643 assert(ncopies >= 3);
4645 if (ncopies > 9)
4646 MALLOC_COPY(d, s, copysize);
4648 else {
4649 *(d+0) = *(s+0);
4650 *(d+1) = *(s+1);
4651 *(d+2) = *(s+2);
4652 if (ncopies > 4) {
4653 *(d+3) = *(s+3);
4654 *(d+4) = *(s+4);
4655 if (ncopies > 6) {
4656 *(d+5) = *(s+5);
4657 *(d+6) = *(s+6);
4658 if (ncopies > 8) {
4659 *(d+7) = *(s+7);
4660 *(d+8) = *(s+8);
4666 _int_free(av, oldmem);
4667 check_inuse_chunk(av, newp);
4668 return chunk2mem(newp);
4673 /* If possible, free extra space in old or extended chunk */
4675 assert((unsigned long)(newsize) >= (unsigned long)(nb));
4677 remainder_size = newsize - nb;
4679 if (remainder_size < MINSIZE) { /* not enough extra to split off */
4680 set_head_size(newp, newsize | (av != &main_arena ? NON_MAIN_ARENA : 0));
4681 set_inuse_bit_at_offset(newp, newsize);
4683 else { /* split remainder */
4684 remainder = chunk_at_offset(newp, nb);
4685 set_head_size(newp, nb | (av != &main_arena ? NON_MAIN_ARENA : 0));
4686 set_head(remainder, remainder_size | PREV_INUSE |
4687 (av != &main_arena ? NON_MAIN_ARENA : 0));
4688 /* Mark remainder as inuse so free() won't complain */
4689 set_inuse_bit_at_offset(remainder, remainder_size);
4690 _int_free(av, chunk2mem(remainder));
4693 check_inuse_chunk(av, newp);
4694 return chunk2mem(newp);
4698 Handle mmap cases
4701 else {
4702 #if HAVE_MMAP
4704 #if HAVE_MREMAP
4705 INTERNAL_SIZE_T offset = oldp->prev_size;
4706 size_t pagemask = mp_.pagesize - 1;
4707 char *cp;
4708 unsigned long sum;
4710 /* Note the extra SIZE_SZ overhead */
4711 newsize = (nb + offset + SIZE_SZ + pagemask) & ~pagemask;
4713 /* don't need to remap if still within same page */
4714 if (oldsize == newsize - offset)
4715 return oldmem;
4717 cp = (char*)mremap((char*)oldp - offset, oldsize + offset, newsize, 1);
4719 if (cp != MAP_FAILED) {
4721 newp = (mchunkptr)(cp + offset);
4722 set_head(newp, (newsize - offset)|IS_MMAPPED);
4724 assert(aligned_OK(chunk2mem(newp)));
4725 assert((newp->prev_size == offset));
4727 /* update statistics */
4728 sum = mp_.mmapped_mem += newsize - oldsize;
4729 if (sum > (unsigned long)(mp_.max_mmapped_mem))
4730 mp_.max_mmapped_mem = sum;
4731 #ifdef NO_THREADS
4732 sum += main_arena.system_mem;
4733 if (sum > (unsigned long)(mp_.max_total_mem))
4734 mp_.max_total_mem = sum;
4735 #endif
4737 return chunk2mem(newp);
4739 #endif
4741 /* Note the extra SIZE_SZ overhead. */
4742 if ((unsigned long)(oldsize) >= (unsigned long)(nb + SIZE_SZ))
4743 newmem = oldmem; /* do nothing */
4744 else {
4745 /* Must alloc, copy, free. */
4746 newmem = _int_malloc(av, nb - MALLOC_ALIGN_MASK);
4747 if (newmem != 0) {
4748 MALLOC_COPY(newmem, oldmem, oldsize - 2*SIZE_SZ);
4749 _int_free(av, oldmem);
4752 return newmem;
4754 #else
4755 /* If !HAVE_MMAP, but chunk_is_mmapped, user must have overwritten mem */
4756 check_malloc_state(av);
4757 MALLOC_FAILURE_ACTION;
4758 return 0;
4759 #endif
4764 ------------------------------ memalign ------------------------------
4767 Void_t*
4768 _int_memalign(mstate av, size_t alignment, size_t bytes)
4770 INTERNAL_SIZE_T nb; /* padded request size */
4771 char* m; /* memory returned by malloc call */
4772 mchunkptr p; /* corresponding chunk */
4773 char* brk; /* alignment point within p */
4774 mchunkptr newp; /* chunk to return */
4775 INTERNAL_SIZE_T newsize; /* its size */
4776 INTERNAL_SIZE_T leadsize; /* leading space before alignment point */
4777 mchunkptr remainder; /* spare room at end to split off */
4778 unsigned long remainder_size; /* its size */
4779 INTERNAL_SIZE_T size;
4781 /* If need less alignment than we give anyway, just relay to malloc */
4783 if (alignment <= MALLOC_ALIGNMENT) return _int_malloc(av, bytes);
4785 /* Otherwise, ensure that it is at least a minimum chunk size */
4787 if (alignment < MINSIZE) alignment = MINSIZE;
4789 /* Make sure alignment is power of 2 (in case MINSIZE is not). */
4790 if ((alignment & (alignment - 1)) != 0) {
4791 size_t a = MALLOC_ALIGNMENT * 2;
4792 while ((unsigned long)a < (unsigned long)alignment) a <<= 1;
4793 alignment = a;
4796 checked_request2size(bytes, nb);
4799 Strategy: find a spot within that chunk that meets the alignment
4800 request, and then possibly free the leading and trailing space.
4804 /* Call malloc with worst case padding to hit alignment. */
4806 m = (char*)(_int_malloc(av, nb + alignment + MINSIZE));
4808 if (m == 0) return 0; /* propagate failure */
4810 p = mem2chunk(m);
4812 if ((((unsigned long)(m)) % alignment) != 0) { /* misaligned */
4815 Find an aligned spot inside chunk. Since we need to give back
4816 leading space in a chunk of at least MINSIZE, if the first
4817 calculation places us at a spot with less than MINSIZE leader,
4818 we can move to the next aligned spot -- we've allocated enough
4819 total room so that this is always possible.
4822 brk = (char*)mem2chunk(((unsigned long)(m + alignment - 1)) &
4823 -((signed long) alignment));
4824 if ((unsigned long)(brk - (char*)(p)) < MINSIZE)
4825 brk += alignment;
4827 newp = (mchunkptr)brk;
4828 leadsize = brk - (char*)(p);
4829 newsize = chunksize(p) - leadsize;
4831 /* For mmapped chunks, just adjust offset */
4832 if (chunk_is_mmapped(p)) {
4833 newp->prev_size = p->prev_size + leadsize;
4834 set_head(newp, newsize|IS_MMAPPED);
4835 return chunk2mem(newp);
4838 /* Otherwise, give back leader, use the rest */
4839 set_head(newp, newsize | PREV_INUSE |
4840 (av != &main_arena ? NON_MAIN_ARENA : 0));
4841 set_inuse_bit_at_offset(newp, newsize);
4842 set_head_size(p, leadsize | (av != &main_arena ? NON_MAIN_ARENA : 0));
4843 _int_free(av, chunk2mem(p));
4844 p = newp;
4846 assert (newsize >= nb &&
4847 (((unsigned long)(chunk2mem(p))) % alignment) == 0);
4850 /* Also give back spare room at the end */
4851 if (!chunk_is_mmapped(p)) {
4852 size = chunksize(p);
4853 if ((unsigned long)(size) > (unsigned long)(nb + MINSIZE)) {
4854 remainder_size = size - nb;
4855 remainder = chunk_at_offset(p, nb);
4856 set_head(remainder, remainder_size | PREV_INUSE |
4857 (av != &main_arena ? NON_MAIN_ARENA : 0));
4858 set_head_size(p, nb);
4859 _int_free(av, chunk2mem(remainder));
4863 check_inuse_chunk(av, p);
4864 return chunk2mem(p);
4867 #if 0
4869 ------------------------------ calloc ------------------------------
4872 #if __STD_C
4873 Void_t* cALLOc(size_t n_elements, size_t elem_size)
4874 #else
4875 Void_t* cALLOc(n_elements, elem_size) size_t n_elements; size_t elem_size;
4876 #endif
4878 mchunkptr p;
4879 unsigned long clearsize;
4880 unsigned long nclears;
4881 INTERNAL_SIZE_T* d;
4883 Void_t* mem = mALLOc(n_elements * elem_size);
4885 if (mem != 0) {
4886 p = mem2chunk(mem);
4888 #if MMAP_CLEARS
4889 if (!chunk_is_mmapped(p)) /* don't need to clear mmapped space */
4890 #endif
4893 Unroll clear of <= 36 bytes (72 if 8byte sizes)
4894 We know that contents have an odd number of
4895 INTERNAL_SIZE_T-sized words; minimally 3.
4898 d = (INTERNAL_SIZE_T*)mem;
4899 clearsize = chunksize(p) - SIZE_SZ;
4900 nclears = clearsize / sizeof(INTERNAL_SIZE_T);
4901 assert(nclears >= 3);
4903 if (nclears > 9)
4904 MALLOC_ZERO(d, clearsize);
4906 else {
4907 *(d+0) = 0;
4908 *(d+1) = 0;
4909 *(d+2) = 0;
4910 if (nclears > 4) {
4911 *(d+3) = 0;
4912 *(d+4) = 0;
4913 if (nclears > 6) {
4914 *(d+5) = 0;
4915 *(d+6) = 0;
4916 if (nclears > 8) {
4917 *(d+7) = 0;
4918 *(d+8) = 0;
4925 return mem;
4927 #endif /* 0 */
4930 ------------------------- independent_calloc -------------------------
4933 Void_t**
4934 #if __STD_C
4935 _int_icalloc(mstate av, size_t n_elements, size_t elem_size, Void_t* chunks[])
4936 #else
4937 _int_icalloc(av, n_elements, elem_size, chunks)
4938 mstate av; size_t n_elements; size_t elem_size; Void_t* chunks[];
4939 #endif
4941 size_t sz = elem_size; /* serves as 1-element array */
4942 /* opts arg of 3 means all elements are same size, and should be cleared */
4943 return iALLOc(av, n_elements, &sz, 3, chunks);
4947 ------------------------- independent_comalloc -------------------------
4950 Void_t**
4951 #if __STD_C
4952 _int_icomalloc(mstate av, size_t n_elements, size_t sizes[], Void_t* chunks[])
4953 #else
4954 _int_icomalloc(av, n_elements, sizes, chunks)
4955 mstate av; size_t n_elements; size_t sizes[]; Void_t* chunks[];
4956 #endif
4958 return iALLOc(av, n_elements, sizes, 0, chunks);
4963 ------------------------------ ialloc ------------------------------
4964 ialloc provides common support for independent_X routines, handling all of
4965 the combinations that can result.
4967 The opts arg has:
4968 bit 0 set if all elements are same size (using sizes[0])
4969 bit 1 set if elements should be zeroed
4973 static Void_t**
4974 #if __STD_C
4975 iALLOc(mstate av, size_t n_elements, size_t* sizes, int opts, Void_t* chunks[])
4976 #else
4977 iALLOc(av, n_elements, sizes, opts, chunks)
4978 mstate av; size_t n_elements; size_t* sizes; int opts; Void_t* chunks[];
4979 #endif
4981 INTERNAL_SIZE_T element_size; /* chunksize of each element, if all same */
4982 INTERNAL_SIZE_T contents_size; /* total size of elements */
4983 INTERNAL_SIZE_T array_size; /* request size of pointer array */
4984 Void_t* mem; /* malloced aggregate space */
4985 mchunkptr p; /* corresponding chunk */
4986 INTERNAL_SIZE_T remainder_size; /* remaining bytes while splitting */
4987 Void_t** marray; /* either "chunks" or malloced ptr array */
4988 mchunkptr array_chunk; /* chunk for malloced ptr array */
4989 int mmx; /* to disable mmap */
4990 INTERNAL_SIZE_T size;
4991 INTERNAL_SIZE_T size_flags;
4992 size_t i;
4994 /* Ensure initialization/consolidation */
4995 if (have_fastchunks(av)) malloc_consolidate(av);
4997 /* compute array length, if needed */
4998 if (chunks != 0) {
4999 if (n_elements == 0)
5000 return chunks; /* nothing to do */
5001 marray = chunks;
5002 array_size = 0;
5004 else {
5005 /* if empty req, must still return chunk representing empty array */
5006 if (n_elements == 0)
5007 return (Void_t**) _int_malloc(av, 0);
5008 marray = 0;
5009 array_size = request2size(n_elements * (sizeof(Void_t*)));
5012 /* compute total element size */
5013 if (opts & 0x1) { /* all-same-size */
5014 element_size = request2size(*sizes);
5015 contents_size = n_elements * element_size;
5017 else { /* add up all the sizes */
5018 element_size = 0;
5019 contents_size = 0;
5020 for (i = 0; i != n_elements; ++i)
5021 contents_size += request2size(sizes[i]);
5024 /* subtract out alignment bytes from total to minimize overallocation */
5025 size = contents_size + array_size - MALLOC_ALIGN_MASK;
5028 Allocate the aggregate chunk.
5029 But first disable mmap so malloc won't use it, since
5030 we would not be able to later free/realloc space internal
5031 to a segregated mmap region.
5033 mmx = mp_.n_mmaps_max; /* disable mmap */
5034 mp_.n_mmaps_max = 0;
5035 mem = _int_malloc(av, size);
5036 mp_.n_mmaps_max = mmx; /* reset mmap */
5037 if (mem == 0)
5038 return 0;
5040 p = mem2chunk(mem);
5041 assert(!chunk_is_mmapped(p));
5042 remainder_size = chunksize(p);
5044 if (opts & 0x2) { /* optionally clear the elements */
5045 MALLOC_ZERO(mem, remainder_size - SIZE_SZ - array_size);
5048 size_flags = PREV_INUSE | (av != &main_arena ? NON_MAIN_ARENA : 0);
5050 /* If not provided, allocate the pointer array as final part of chunk */
5051 if (marray == 0) {
5052 array_chunk = chunk_at_offset(p, contents_size);
5053 marray = (Void_t**) (chunk2mem(array_chunk));
5054 set_head(array_chunk, (remainder_size - contents_size) | size_flags);
5055 remainder_size = contents_size;
5058 /* split out elements */
5059 for (i = 0; ; ++i) {
5060 marray[i] = chunk2mem(p);
5061 if (i != n_elements-1) {
5062 if (element_size != 0)
5063 size = element_size;
5064 else
5065 size = request2size(sizes[i]);
5066 remainder_size -= size;
5067 set_head(p, size | size_flags);
5068 p = chunk_at_offset(p, size);
5070 else { /* the final element absorbs any overallocation slop */
5071 set_head(p, remainder_size | size_flags);
5072 break;
5076 #if MALLOC_DEBUG
5077 if (marray != chunks) {
5078 /* final element must have exactly exhausted chunk */
5079 if (element_size != 0)
5080 assert(remainder_size == element_size);
5081 else
5082 assert(remainder_size == request2size(sizes[i]));
5083 check_inuse_chunk(av, mem2chunk(marray));
5086 for (i = 0; i != n_elements; ++i)
5087 check_inuse_chunk(av, mem2chunk(marray[i]));
5088 #endif
5090 return marray;
5095 ------------------------------ valloc ------------------------------
5098 Void_t*
5099 #if __STD_C
5100 _int_valloc(mstate av, size_t bytes)
5101 #else
5102 _int_valloc(av, bytes) mstate av; size_t bytes;
5103 #endif
5105 /* Ensure initialization/consolidation */
5106 if (have_fastchunks(av)) malloc_consolidate(av);
5107 return _int_memalign(av, mp_.pagesize, bytes);
5111 ------------------------------ pvalloc ------------------------------
5115 Void_t*
5116 #if __STD_C
5117 _int_pvalloc(mstate av, size_t bytes)
5118 #else
5119 _int_pvalloc(av, bytes) mstate av, size_t bytes;
5120 #endif
5122 size_t pagesz;
5124 /* Ensure initialization/consolidation */
5125 if (have_fastchunks(av)) malloc_consolidate(av);
5126 pagesz = mp_.pagesize;
5127 return _int_memalign(av, pagesz, (bytes + pagesz - 1) & ~(pagesz - 1));
5132 ------------------------------ malloc_trim ------------------------------
5135 #if __STD_C
5136 int mTRIm(size_t pad)
5137 #else
5138 int mTRIm(pad) size_t pad;
5139 #endif
5141 mstate av = &main_arena; /* already locked */
5143 /* Ensure initialization/consolidation */
5144 malloc_consolidate(av);
5146 #ifndef MORECORE_CANNOT_TRIM
5147 return sYSTRIm(pad, av);
5148 #else
5149 return 0;
5150 #endif
5155 ------------------------- malloc_usable_size -------------------------
5158 #if __STD_C
5159 size_t mUSABLe(Void_t* mem)
5160 #else
5161 size_t mUSABLe(mem) Void_t* mem;
5162 #endif
5164 mchunkptr p;
5165 if (mem != 0) {
5166 p = mem2chunk(mem);
5167 if (chunk_is_mmapped(p))
5168 return chunksize(p) - 2*SIZE_SZ;
5169 else if (inuse(p))
5170 return chunksize(p) - SIZE_SZ;
5172 return 0;
5176 ------------------------------ mallinfo ------------------------------
5179 struct mallinfo mALLINFo(mstate av)
5181 struct mallinfo mi;
5182 size_t i;
5183 mbinptr b;
5184 mchunkptr p;
5185 INTERNAL_SIZE_T avail;
5186 INTERNAL_SIZE_T fastavail;
5187 int nblocks;
5188 int nfastblocks;
5190 /* Ensure initialization */
5191 if (av->top == 0) malloc_consolidate(av);
5193 check_malloc_state(av);
5195 /* Account for top */
5196 avail = chunksize(av->top);
5197 nblocks = 1; /* top always exists */
5199 /* traverse fastbins */
5200 nfastblocks = 0;
5201 fastavail = 0;
5203 for (i = 0; i < NFASTBINS; ++i) {
5204 for (p = av->fastbins[i]; p != 0; p = p->fd) {
5205 ++nfastblocks;
5206 fastavail += chunksize(p);
5210 avail += fastavail;
5212 /* traverse regular bins */
5213 for (i = 1; i < NBINS; ++i) {
5214 b = bin_at(av, i);
5215 for (p = last(b); p != b; p = p->bk) {
5216 ++nblocks;
5217 avail += chunksize(p);
5221 mi.smblks = nfastblocks;
5222 mi.ordblks = nblocks;
5223 mi.fordblks = avail;
5224 mi.uordblks = av->system_mem - avail;
5225 mi.arena = av->system_mem;
5226 mi.hblks = mp_.n_mmaps;
5227 mi.hblkhd = mp_.mmapped_mem;
5228 mi.fsmblks = fastavail;
5229 mi.keepcost = chunksize(av->top);
5230 mi.usmblks = mp_.max_total_mem;
5231 return mi;
5235 ------------------------------ malloc_stats ------------------------------
5238 void mSTATs()
5240 int i;
5241 mstate ar_ptr;
5242 struct mallinfo mi;
5243 unsigned int in_use_b = mp_.mmapped_mem, system_b = in_use_b;
5244 #if THREAD_STATS
5245 long stat_lock_direct = 0, stat_lock_loop = 0, stat_lock_wait = 0;
5246 #endif
5248 if(__malloc_initialized < 0)
5249 ptmalloc_init ();
5250 #ifdef _LIBC
5251 _IO_flockfile (stderr);
5252 int old_flags2 = ((_IO_FILE *) stderr)->_flags2;
5253 ((_IO_FILE *) stderr)->_flags2 |= _IO_FLAGS2_NOTCANCEL;
5254 #endif
5255 for (i=0, ar_ptr = &main_arena;; i++) {
5256 (void)mutex_lock(&ar_ptr->mutex);
5257 mi = mALLINFo(ar_ptr);
5258 fprintf(stderr, "Arena %d:\n", i);
5259 fprintf(stderr, "system bytes = %10u\n", (unsigned int)mi.arena);
5260 fprintf(stderr, "in use bytes = %10u\n", (unsigned int)mi.uordblks);
5261 #if MALLOC_DEBUG > 1
5262 if (i > 0)
5263 dump_heap(heap_for_ptr(top(ar_ptr)));
5264 #endif
5265 system_b += mi.arena;
5266 in_use_b += mi.uordblks;
5267 #if THREAD_STATS
5268 stat_lock_direct += ar_ptr->stat_lock_direct;
5269 stat_lock_loop += ar_ptr->stat_lock_loop;
5270 stat_lock_wait += ar_ptr->stat_lock_wait;
5271 #endif
5272 (void)mutex_unlock(&ar_ptr->mutex);
5273 ar_ptr = ar_ptr->next;
5274 if(ar_ptr == &main_arena) break;
5276 #if HAVE_MMAP
5277 fprintf(stderr, "Total (incl. mmap):\n");
5278 #else
5279 fprintf(stderr, "Total:\n");
5280 #endif
5281 fprintf(stderr, "system bytes = %10u\n", system_b);
5282 fprintf(stderr, "in use bytes = %10u\n", in_use_b);
5283 #ifdef NO_THREADS
5284 fprintf(stderr, "max system bytes = %10u\n", (unsigned int)mp_.max_total_mem);
5285 #endif
5286 #if HAVE_MMAP
5287 fprintf(stderr, "max mmap regions = %10u\n", (unsigned int)mp_.max_n_mmaps);
5288 fprintf(stderr, "max mmap bytes = %10lu\n",
5289 (unsigned long)mp_.max_mmapped_mem);
5290 #endif
5291 #if THREAD_STATS
5292 fprintf(stderr, "heaps created = %10d\n", stat_n_heaps);
5293 fprintf(stderr, "locked directly = %10ld\n", stat_lock_direct);
5294 fprintf(stderr, "locked in loop = %10ld\n", stat_lock_loop);
5295 fprintf(stderr, "locked waiting = %10ld\n", stat_lock_wait);
5296 fprintf(stderr, "locked total = %10ld\n",
5297 stat_lock_direct + stat_lock_loop + stat_lock_wait);
5298 #endif
5299 #ifdef _LIBC
5300 ((_IO_FILE *) stderr)->_flags2 |= old_flags2;
5301 _IO_funlockfile (stderr);
5302 #endif
5307 ------------------------------ mallopt ------------------------------
5310 #if __STD_C
5311 int mALLOPt(int param_number, int value)
5312 #else
5313 int mALLOPt(param_number, value) int param_number; int value;
5314 #endif
5316 mstate av = &main_arena;
5317 int res = 1;
5319 if(__malloc_initialized < 0)
5320 ptmalloc_init ();
5321 (void)mutex_lock(&av->mutex);
5322 /* Ensure initialization/consolidation */
5323 malloc_consolidate(av);
5325 switch(param_number) {
5326 case M_MXFAST:
5327 if (value >= 0 && value <= MAX_FAST_SIZE) {
5328 set_max_fast(av, value);
5330 else
5331 res = 0;
5332 break;
5334 case M_TRIM_THRESHOLD:
5335 mp_.trim_threshold = value;
5336 break;
5338 case M_TOP_PAD:
5339 mp_.top_pad = value;
5340 break;
5342 case M_MMAP_THRESHOLD:
5343 #if USE_ARENAS
5344 /* Forbid setting the threshold too high. */
5345 if((unsigned long)value > HEAP_MAX_SIZE/2)
5346 res = 0;
5347 else
5348 #endif
5349 mp_.mmap_threshold = value;
5350 break;
5352 case M_MMAP_MAX:
5353 #if !HAVE_MMAP
5354 if (value != 0)
5355 res = 0;
5356 else
5357 #endif
5358 mp_.n_mmaps_max = value;
5359 break;
5361 case M_CHECK_ACTION:
5362 check_action = value;
5363 break;
5365 (void)mutex_unlock(&av->mutex);
5366 return res;
5371 -------------------- Alternative MORECORE functions --------------------
5376 General Requirements for MORECORE.
5378 The MORECORE function must have the following properties:
5380 If MORECORE_CONTIGUOUS is false:
5382 * MORECORE must allocate in multiples of pagesize. It will
5383 only be called with arguments that are multiples of pagesize.
5385 * MORECORE(0) must return an address that is at least
5386 MALLOC_ALIGNMENT aligned. (Page-aligning always suffices.)
5388 else (i.e. If MORECORE_CONTIGUOUS is true):
5390 * Consecutive calls to MORECORE with positive arguments
5391 return increasing addresses, indicating that space has been
5392 contiguously extended.
5394 * MORECORE need not allocate in multiples of pagesize.
5395 Calls to MORECORE need not have args of multiples of pagesize.
5397 * MORECORE need not page-align.
5399 In either case:
5401 * MORECORE may allocate more memory than requested. (Or even less,
5402 but this will generally result in a malloc failure.)
5404 * MORECORE must not allocate memory when given argument zero, but
5405 instead return one past the end address of memory from previous
5406 nonzero call. This malloc does NOT call MORECORE(0)
5407 until at least one call with positive arguments is made, so
5408 the initial value returned is not important.
5410 * Even though consecutive calls to MORECORE need not return contiguous
5411 addresses, it must be OK for malloc'ed chunks to span multiple
5412 regions in those cases where they do happen to be contiguous.
5414 * MORECORE need not handle negative arguments -- it may instead
5415 just return MORECORE_FAILURE when given negative arguments.
5416 Negative arguments are always multiples of pagesize. MORECORE
5417 must not misinterpret negative args as large positive unsigned
5418 args. You can suppress all such calls from even occurring by defining
5419 MORECORE_CANNOT_TRIM,
5421 There is some variation across systems about the type of the
5422 argument to sbrk/MORECORE. If size_t is unsigned, then it cannot
5423 actually be size_t, because sbrk supports negative args, so it is
5424 normally the signed type of the same width as size_t (sometimes
5425 declared as "intptr_t", and sometimes "ptrdiff_t"). It doesn't much
5426 matter though. Internally, we use "long" as arguments, which should
5427 work across all reasonable possibilities.
5429 Additionally, if MORECORE ever returns failure for a positive
5430 request, and HAVE_MMAP is true, then mmap is used as a noncontiguous
5431 system allocator. This is a useful backup strategy for systems with
5432 holes in address spaces -- in this case sbrk cannot contiguously
5433 expand the heap, but mmap may be able to map noncontiguous space.
5435 If you'd like mmap to ALWAYS be used, you can define MORECORE to be
5436 a function that always returns MORECORE_FAILURE.
5438 If you are using this malloc with something other than sbrk (or its
5439 emulation) to supply memory regions, you probably want to set
5440 MORECORE_CONTIGUOUS as false. As an example, here is a custom
5441 allocator kindly contributed for pre-OSX macOS. It uses virtually
5442 but not necessarily physically contiguous non-paged memory (locked
5443 in, present and won't get swapped out). You can use it by
5444 uncommenting this section, adding some #includes, and setting up the
5445 appropriate defines above:
5447 #define MORECORE osMoreCore
5448 #define MORECORE_CONTIGUOUS 0
5450 There is also a shutdown routine that should somehow be called for
5451 cleanup upon program exit.
5453 #define MAX_POOL_ENTRIES 100
5454 #define MINIMUM_MORECORE_SIZE (64 * 1024)
5455 static int next_os_pool;
5456 void *our_os_pools[MAX_POOL_ENTRIES];
5458 void *osMoreCore(int size)
5460 void *ptr = 0;
5461 static void *sbrk_top = 0;
5463 if (size > 0)
5465 if (size < MINIMUM_MORECORE_SIZE)
5466 size = MINIMUM_MORECORE_SIZE;
5467 if (CurrentExecutionLevel() == kTaskLevel)
5468 ptr = PoolAllocateResident(size + RM_PAGE_SIZE, 0);
5469 if (ptr == 0)
5471 return (void *) MORECORE_FAILURE;
5473 // save ptrs so they can be freed during cleanup
5474 our_os_pools[next_os_pool] = ptr;
5475 next_os_pool++;
5476 ptr = (void *) ((((unsigned long) ptr) + RM_PAGE_MASK) & ~RM_PAGE_MASK);
5477 sbrk_top = (char *) ptr + size;
5478 return ptr;
5480 else if (size < 0)
5482 // we don't currently support shrink behavior
5483 return (void *) MORECORE_FAILURE;
5485 else
5487 return sbrk_top;
5491 // cleanup any allocated memory pools
5492 // called as last thing before shutting down driver
5494 void osCleanupMem(void)
5496 void **ptr;
5498 for (ptr = our_os_pools; ptr < &our_os_pools[MAX_POOL_ENTRIES]; ptr++)
5499 if (*ptr)
5501 PoolDeallocate(*ptr);
5502 *ptr = 0;
5509 /* Helper code. */
5511 static void
5512 malloc_printerr(int action, const char *str, void *ptr)
5514 if (action & 1)
5516 char buf[2 * sizeof (uintptr_t) + 1];
5518 buf[sizeof (buf) - 1] = '\0';
5519 char *cp = _itoa_word ((uintptr_t) ptr, &buf[sizeof (buf) - 1], 16, 0);
5520 while (cp > buf)
5521 *--cp = '0';
5523 __libc_message (action & 2,
5524 action & 4
5525 ? "%s\n" : "*** glibc detected *** %s: 0x%s ***\n",
5526 str, cp);
5528 else if (action & 2)
5529 abort ();
5532 #ifdef _LIBC
5533 # include <sys/param.h>
5535 /* We need a wrapper function for one of the additions of POSIX. */
5537 __posix_memalign (void **memptr, size_t alignment, size_t size)
5539 void *mem;
5540 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
5541 __const __malloc_ptr_t)) =
5542 __memalign_hook;
5544 /* Test whether the SIZE argument is valid. It must be a power of
5545 two multiple of sizeof (void *). */
5546 if (alignment % sizeof (void *) != 0
5547 || !powerof2 (alignment / sizeof (void *)) != 0
5548 || alignment == 0)
5549 return EINVAL;
5551 /* Call the hook here, so that caller is posix_memalign's caller
5552 and not posix_memalign itself. */
5553 if (hook != NULL)
5554 mem = (*hook)(alignment, size, RETURN_ADDRESS (0));
5555 else
5556 mem = public_mEMALIGn (alignment, size);
5558 if (mem != NULL) {
5559 *memptr = mem;
5560 return 0;
5563 return ENOMEM;
5565 weak_alias (__posix_memalign, posix_memalign)
5567 strong_alias (__libc_calloc, __calloc) weak_alias (__libc_calloc, calloc)
5568 strong_alias (__libc_free, __cfree) weak_alias (__libc_free, cfree)
5569 strong_alias (__libc_free, __free) strong_alias (__libc_free, free)
5570 strong_alias (__libc_malloc, __malloc) strong_alias (__libc_malloc, malloc)
5571 strong_alias (__libc_memalign, __memalign)
5572 weak_alias (__libc_memalign, memalign)
5573 strong_alias (__libc_realloc, __realloc) strong_alias (__libc_realloc, realloc)
5574 strong_alias (__libc_valloc, __valloc) weak_alias (__libc_valloc, valloc)
5575 strong_alias (__libc_pvalloc, __pvalloc) weak_alias (__libc_pvalloc, pvalloc)
5576 strong_alias (__libc_mallinfo, __mallinfo)
5577 weak_alias (__libc_mallinfo, mallinfo)
5578 strong_alias (__libc_mallopt, __mallopt) weak_alias (__libc_mallopt, mallopt)
5580 weak_alias (__malloc_stats, malloc_stats)
5581 weak_alias (__malloc_usable_size, malloc_usable_size)
5582 weak_alias (__malloc_trim, malloc_trim)
5583 weak_alias (__malloc_get_state, malloc_get_state)
5584 weak_alias (__malloc_set_state, malloc_set_state)
5586 #endif /* _LIBC */
5588 /* ------------------------------------------------------------
5589 History:
5591 [see ftp://g.oswego.edu/pub/misc/malloc.c for the history of dlmalloc]
5595 * Local variables:
5596 * c-basic-offset: 2
5597 * End: