2005-04-27 Ulrich Drepper <drepper@redhat.com>
[glibc/history.git] / malloc / malloc.c
blob35ec8d6a569da7e2986886bf33a166838f894354
1 /* Malloc implementation for multiple threads without lock contention.
2 Copyright (C) 1996-2002, 2003, 2004 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Wolfram Gloger <wg@malloc.de>
5 and Doug Lea <dl@cs.oswego.edu>, 2001.
7 The GNU C Library is free software; you can redistribute it and/or
8 modify it under the terms of the GNU Lesser General Public License as
9 published by the Free Software Foundation; either version 2.1 of the
10 License, or (at your option) any later version.
12 The GNU C Library is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 Lesser General Public License for more details.
17 You should have received a copy of the GNU Lesser General Public
18 License along with the GNU C Library; see the file COPYING.LIB. If not,
19 write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA. */
23 This is a version (aka ptmalloc2) of malloc/free/realloc written by
24 Doug Lea and adapted to multiple threads/arenas by Wolfram Gloger.
26 * Version ptmalloc2-20011215
27 $Id$
28 based on:
29 VERSION 2.7.0 Sun Mar 11 14:14:06 2001 Doug Lea (dl at gee)
31 Note: There may be an updated version of this malloc obtainable at
32 http://www.malloc.de/malloc/ptmalloc2.tar.gz
33 Check before installing!
35 * Quickstart
37 In order to compile this implementation, a Makefile is provided with
38 the ptmalloc2 distribution, which has pre-defined targets for some
39 popular systems (e.g. "make posix" for Posix threads). All that is
40 typically required with regard to compiler flags is the selection of
41 the thread package via defining one out of USE_PTHREADS, USE_THR or
42 USE_SPROC. Check the thread-m.h file for what effects this has.
43 Many/most systems will additionally require USE_TSD_DATA_HACK to be
44 defined, so this is the default for "make posix".
46 * Why use this malloc?
48 This is not the fastest, most space-conserving, most portable, or
49 most tunable malloc ever written. However it is among the fastest
50 while also being among the most space-conserving, portable and tunable.
51 Consistent balance across these factors results in a good general-purpose
52 allocator for malloc-intensive programs.
54 The main properties of the algorithms are:
55 * For large (>= 512 bytes) requests, it is a pure best-fit allocator,
56 with ties normally decided via FIFO (i.e. least recently used).
57 * For small (<= 64 bytes by default) requests, it is a caching
58 allocator, that maintains pools of quickly recycled chunks.
59 * In between, and for combinations of large and small requests, it does
60 the best it can trying to meet both goals at once.
61 * For very large requests (>= 128KB by default), it relies on system
62 memory mapping facilities, if supported.
64 For a longer but slightly out of date high-level description, see
65 http://gee.cs.oswego.edu/dl/html/malloc.html
67 You may already by default be using a C library containing a malloc
68 that is based on some version of this malloc (for example in
69 linux). You might still want to use the one in this file in order to
70 customize settings or to avoid overheads associated with library
71 versions.
73 * Contents, described in more detail in "description of public routines" below.
75 Standard (ANSI/SVID/...) functions:
76 malloc(size_t n);
77 calloc(size_t n_elements, size_t element_size);
78 free(Void_t* p);
79 realloc(Void_t* p, size_t n);
80 memalign(size_t alignment, size_t n);
81 valloc(size_t n);
82 mallinfo()
83 mallopt(int parameter_number, int parameter_value)
85 Additional functions:
86 independent_calloc(size_t n_elements, size_t size, Void_t* chunks[]);
87 independent_comalloc(size_t n_elements, size_t sizes[], Void_t* chunks[]);
88 pvalloc(size_t n);
89 cfree(Void_t* p);
90 malloc_trim(size_t pad);
91 malloc_usable_size(Void_t* p);
92 malloc_stats();
94 * Vital statistics:
96 Supported pointer representation: 4 or 8 bytes
97 Supported size_t representation: 4 or 8 bytes
98 Note that size_t is allowed to be 4 bytes even if pointers are 8.
99 You can adjust this by defining INTERNAL_SIZE_T
101 Alignment: 2 * sizeof(size_t) (default)
102 (i.e., 8 byte alignment with 4byte size_t). This suffices for
103 nearly all current machines and C compilers. However, you can
104 define MALLOC_ALIGNMENT to be wider than this if necessary.
106 Minimum overhead per allocated chunk: 4 or 8 bytes
107 Each malloced chunk has a hidden word of overhead holding size
108 and status information.
110 Minimum allocated size: 4-byte ptrs: 16 bytes (including 4 overhead)
111 8-byte ptrs: 24/32 bytes (including, 4/8 overhead)
113 When a chunk is freed, 12 (for 4byte ptrs) or 20 (for 8 byte
114 ptrs but 4 byte size) or 24 (for 8/8) additional bytes are
115 needed; 4 (8) for a trailing size field and 8 (16) bytes for
116 free list pointers. Thus, the minimum allocatable size is
117 16/24/32 bytes.
119 Even a request for zero bytes (i.e., malloc(0)) returns a
120 pointer to something of the minimum allocatable size.
122 The maximum overhead wastage (i.e., number of extra bytes
123 allocated than were requested in malloc) is less than or equal
124 to the minimum size, except for requests >= mmap_threshold that
125 are serviced via mmap(), where the worst case wastage is 2 *
126 sizeof(size_t) bytes plus the remainder from a system page (the
127 minimal mmap unit); typically 4096 or 8192 bytes.
129 Maximum allocated size: 4-byte size_t: 2^32 minus about two pages
130 8-byte size_t: 2^64 minus about two pages
132 It is assumed that (possibly signed) size_t values suffice to
133 represent chunk sizes. `Possibly signed' is due to the fact
134 that `size_t' may be defined on a system as either a signed or
135 an unsigned type. The ISO C standard says that it must be
136 unsigned, but a few systems are known not to adhere to this.
137 Additionally, even when size_t is unsigned, sbrk (which is by
138 default used to obtain memory from system) accepts signed
139 arguments, and may not be able to handle size_t-wide arguments
140 with negative sign bit. Generally, values that would
141 appear as negative after accounting for overhead and alignment
142 are supported only via mmap(), which does not have this
143 limitation.
145 Requests for sizes outside the allowed range will perform an optional
146 failure action and then return null. (Requests may also
147 also fail because a system is out of memory.)
149 Thread-safety: thread-safe unless NO_THREADS is defined
151 Compliance: I believe it is compliant with the 1997 Single Unix Specification
152 (See http://www.opennc.org). Also SVID/XPG, ANSI C, and probably
153 others as well.
155 * Synopsis of compile-time options:
157 People have reported using previous versions of this malloc on all
158 versions of Unix, sometimes by tweaking some of the defines
159 below. It has been tested most extensively on Solaris and
160 Linux. It is also reported to work on WIN32 platforms.
161 People also report using it in stand-alone embedded systems.
163 The implementation is in straight, hand-tuned ANSI C. It is not
164 at all modular. (Sorry!) It uses a lot of macros. To be at all
165 usable, this code should be compiled using an optimizing compiler
166 (for example gcc -O3) that can simplify expressions and control
167 paths. (FAQ: some macros import variables as arguments rather than
168 declare locals because people reported that some debuggers
169 otherwise get confused.)
171 OPTION DEFAULT VALUE
173 Compilation Environment options:
175 __STD_C derived from C compiler defines
176 WIN32 NOT defined
177 HAVE_MEMCPY defined
178 USE_MEMCPY 1 if HAVE_MEMCPY is defined
179 HAVE_MMAP defined as 1
180 MMAP_CLEARS 1
181 HAVE_MREMAP 0 unless linux defined
182 USE_ARENAS the same as HAVE_MMAP
183 malloc_getpagesize derived from system #includes, or 4096 if not
184 HAVE_USR_INCLUDE_MALLOC_H NOT defined
185 LACKS_UNISTD_H NOT defined unless WIN32
186 LACKS_SYS_PARAM_H NOT defined unless WIN32
187 LACKS_SYS_MMAN_H NOT defined unless WIN32
189 Changing default word sizes:
191 INTERNAL_SIZE_T size_t
192 MALLOC_ALIGNMENT 2 * sizeof(INTERNAL_SIZE_T)
194 Configuration and functionality options:
196 USE_DL_PREFIX NOT defined
197 USE_PUBLIC_MALLOC_WRAPPERS NOT defined
198 USE_MALLOC_LOCK NOT defined
199 MALLOC_DEBUG NOT defined
200 REALLOC_ZERO_BYTES_FREES 1
201 MALLOC_FAILURE_ACTION errno = ENOMEM, if __STD_C defined, else no-op
202 TRIM_FASTBINS 0
204 Options for customizing MORECORE:
206 MORECORE sbrk
207 MORECORE_FAILURE -1
208 MORECORE_CONTIGUOUS 1
209 MORECORE_CANNOT_TRIM NOT defined
210 MORECORE_CLEARS 1
211 MMAP_AS_MORECORE_SIZE (1024 * 1024)
213 Tuning options that are also dynamically changeable via mallopt:
215 DEFAULT_MXFAST 64
216 DEFAULT_TRIM_THRESHOLD 128 * 1024
217 DEFAULT_TOP_PAD 0
218 DEFAULT_MMAP_THRESHOLD 128 * 1024
219 DEFAULT_MMAP_MAX 65536
221 There are several other #defined constants and macros that you
222 probably don't want to touch unless you are extending or adapting malloc. */
225 __STD_C should be nonzero if using ANSI-standard C compiler, a C++
226 compiler, or a C compiler sufficiently close to ANSI to get away
227 with it.
230 #ifndef __STD_C
231 #if defined(__STDC__) || defined(__cplusplus)
232 #define __STD_C 1
233 #else
234 #define __STD_C 0
235 #endif
236 #endif /*__STD_C*/
240 Void_t* is the pointer type that malloc should say it returns
243 #ifndef Void_t
244 #if (__STD_C || defined(WIN32))
245 #define Void_t void
246 #else
247 #define Void_t char
248 #endif
249 #endif /*Void_t*/
251 #if __STD_C
252 #include <stddef.h> /* for size_t */
253 #include <stdlib.h> /* for getenv(), abort() */
254 #else
255 #include <sys/types.h>
256 #endif
258 #include <malloc-machine.h>
260 #ifdef _LIBC
261 #include <stdio-common/_itoa.h>
262 #endif
264 #ifdef __cplusplus
265 extern "C" {
266 #endif
268 /* define LACKS_UNISTD_H if your system does not have a <unistd.h>. */
270 /* #define LACKS_UNISTD_H */
272 #ifndef LACKS_UNISTD_H
273 #include <unistd.h>
274 #endif
276 /* define LACKS_SYS_PARAM_H if your system does not have a <sys/param.h>. */
278 /* #define LACKS_SYS_PARAM_H */
281 #include <stdio.h> /* needed for malloc_stats */
282 #include <errno.h> /* needed for optional MALLOC_FAILURE_ACTION */
284 /* For uintptr_t. */
285 #include <stdint.h>
287 /* For va_arg, va_start, va_end. */
288 #include <stdarg.h>
290 /* For writev and struct iovec. */
291 #include <sys/uio.h>
292 /* For syslog. */
293 #include <sys/syslog.h>
295 /* For various dynamic linking things. */
296 #include <dlfcn.h>
300 Debugging:
302 Because freed chunks may be overwritten with bookkeeping fields, this
303 malloc will often die when freed memory is overwritten by user
304 programs. This can be very effective (albeit in an annoying way)
305 in helping track down dangling pointers.
307 If you compile with -DMALLOC_DEBUG, a number of assertion checks are
308 enabled that will catch more memory errors. You probably won't be
309 able to make much sense of the actual assertion errors, but they
310 should help you locate incorrectly overwritten memory. The checking
311 is fairly extensive, and will slow down execution
312 noticeably. Calling malloc_stats or mallinfo with MALLOC_DEBUG set
313 will attempt to check every non-mmapped allocated and free chunk in
314 the course of computing the summmaries. (By nature, mmapped regions
315 cannot be checked very much automatically.)
317 Setting MALLOC_DEBUG may also be helpful if you are trying to modify
318 this code. The assertions in the check routines spell out in more
319 detail the assumptions and invariants underlying the algorithms.
321 Setting MALLOC_DEBUG does NOT provide an automated mechanism for
322 checking that all accesses to malloced memory stay within their
323 bounds. However, there are several add-ons and adaptations of this
324 or other mallocs available that do this.
327 #if MALLOC_DEBUG
328 #include <assert.h>
329 #else
330 #undef assert
331 #define assert(x) ((void)0)
332 #endif
336 INTERNAL_SIZE_T is the word-size used for internal bookkeeping
337 of chunk sizes.
339 The default version is the same as size_t.
341 While not strictly necessary, it is best to define this as an
342 unsigned type, even if size_t is a signed type. This may avoid some
343 artificial size limitations on some systems.
345 On a 64-bit machine, you may be able to reduce malloc overhead by
346 defining INTERNAL_SIZE_T to be a 32 bit `unsigned int' at the
347 expense of not being able to handle more than 2^32 of malloced
348 space. If this limitation is acceptable, you are encouraged to set
349 this unless you are on a platform requiring 16byte alignments. In
350 this case the alignment requirements turn out to negate any
351 potential advantages of decreasing size_t word size.
353 Implementors: Beware of the possible combinations of:
354 - INTERNAL_SIZE_T might be signed or unsigned, might be 32 or 64 bits,
355 and might be the same width as int or as long
356 - size_t might have different width and signedness as INTERNAL_SIZE_T
357 - int and long might be 32 or 64 bits, and might be the same width
358 To deal with this, most comparisons and difference computations
359 among INTERNAL_SIZE_Ts should cast them to unsigned long, being
360 aware of the fact that casting an unsigned int to a wider long does
361 not sign-extend. (This also makes checking for negative numbers
362 awkward.) Some of these casts result in harmless compiler warnings
363 on some systems.
366 #ifndef INTERNAL_SIZE_T
367 #define INTERNAL_SIZE_T size_t
368 #endif
370 /* The corresponding word size */
371 #define SIZE_SZ (sizeof(INTERNAL_SIZE_T))
375 MALLOC_ALIGNMENT is the minimum alignment for malloc'ed chunks.
376 It must be a power of two at least 2 * SIZE_SZ, even on machines
377 for which smaller alignments would suffice. It may be defined as
378 larger than this though. Note however that code and data structures
379 are optimized for the case of 8-byte alignment.
383 #ifndef MALLOC_ALIGNMENT
384 #define MALLOC_ALIGNMENT (2 * SIZE_SZ)
385 #endif
387 /* The corresponding bit mask value */
388 #define MALLOC_ALIGN_MASK (MALLOC_ALIGNMENT - 1)
393 REALLOC_ZERO_BYTES_FREES should be set if a call to
394 realloc with zero bytes should be the same as a call to free.
395 This is required by the C standard. Otherwise, since this malloc
396 returns a unique pointer for malloc(0), so does realloc(p, 0).
399 #ifndef REALLOC_ZERO_BYTES_FREES
400 #define REALLOC_ZERO_BYTES_FREES 1
401 #endif
404 TRIM_FASTBINS controls whether free() of a very small chunk can
405 immediately lead to trimming. Setting to true (1) can reduce memory
406 footprint, but will almost always slow down programs that use a lot
407 of small chunks.
409 Define this only if you are willing to give up some speed to more
410 aggressively reduce system-level memory footprint when releasing
411 memory in programs that use many small chunks. You can get
412 essentially the same effect by setting MXFAST to 0, but this can
413 lead to even greater slowdowns in programs using many small chunks.
414 TRIM_FASTBINS is an in-between compile-time option, that disables
415 only those chunks bordering topmost memory from being placed in
416 fastbins.
419 #ifndef TRIM_FASTBINS
420 #define TRIM_FASTBINS 0
421 #endif
425 USE_DL_PREFIX will prefix all public routines with the string 'dl'.
426 This is necessary when you only want to use this malloc in one part
427 of a program, using your regular system malloc elsewhere.
430 /* #define USE_DL_PREFIX */
434 Two-phase name translation.
435 All of the actual routines are given mangled names.
436 When wrappers are used, they become the public callable versions.
437 When DL_PREFIX is used, the callable names are prefixed.
440 #ifdef USE_DL_PREFIX
441 #define public_cALLOc dlcalloc
442 #define public_fREe dlfree
443 #define public_cFREe dlcfree
444 #define public_mALLOc dlmalloc
445 #define public_mEMALIGn dlmemalign
446 #define public_rEALLOc dlrealloc
447 #define public_vALLOc dlvalloc
448 #define public_pVALLOc dlpvalloc
449 #define public_mALLINFo dlmallinfo
450 #define public_mALLOPt dlmallopt
451 #define public_mTRIm dlmalloc_trim
452 #define public_mSTATs dlmalloc_stats
453 #define public_mUSABLe dlmalloc_usable_size
454 #define public_iCALLOc dlindependent_calloc
455 #define public_iCOMALLOc dlindependent_comalloc
456 #define public_gET_STATe dlget_state
457 #define public_sET_STATe dlset_state
458 #else /* USE_DL_PREFIX */
459 #ifdef _LIBC
461 /* Special defines for the GNU C library. */
462 #define public_cALLOc __libc_calloc
463 #define public_fREe __libc_free
464 #define public_cFREe __libc_cfree
465 #define public_mALLOc __libc_malloc
466 #define public_mEMALIGn __libc_memalign
467 #define public_rEALLOc __libc_realloc
468 #define public_vALLOc __libc_valloc
469 #define public_pVALLOc __libc_pvalloc
470 #define public_mALLINFo __libc_mallinfo
471 #define public_mALLOPt __libc_mallopt
472 #define public_mTRIm __malloc_trim
473 #define public_mSTATs __malloc_stats
474 #define public_mUSABLe __malloc_usable_size
475 #define public_iCALLOc __libc_independent_calloc
476 #define public_iCOMALLOc __libc_independent_comalloc
477 #define public_gET_STATe __malloc_get_state
478 #define public_sET_STATe __malloc_set_state
479 #define malloc_getpagesize __getpagesize()
480 #define open __open
481 #define mmap __mmap
482 #define munmap __munmap
483 #define mremap __mremap
484 #define mprotect __mprotect
485 #define MORECORE (*__morecore)
486 #define MORECORE_FAILURE 0
488 Void_t * __default_morecore (ptrdiff_t);
489 Void_t *(*__morecore)(ptrdiff_t) = __default_morecore;
491 #else /* !_LIBC */
492 #define public_cALLOc calloc
493 #define public_fREe free
494 #define public_cFREe cfree
495 #define public_mALLOc malloc
496 #define public_mEMALIGn memalign
497 #define public_rEALLOc realloc
498 #define public_vALLOc valloc
499 #define public_pVALLOc pvalloc
500 #define public_mALLINFo mallinfo
501 #define public_mALLOPt mallopt
502 #define public_mTRIm malloc_trim
503 #define public_mSTATs malloc_stats
504 #define public_mUSABLe malloc_usable_size
505 #define public_iCALLOc independent_calloc
506 #define public_iCOMALLOc independent_comalloc
507 #define public_gET_STATe malloc_get_state
508 #define public_sET_STATe malloc_set_state
509 #endif /* _LIBC */
510 #endif /* USE_DL_PREFIX */
512 #ifndef _LIBC
513 #define __builtin_expect(expr, val) (expr)
515 #define fwrite(buf, size, count, fp) _IO_fwrite (buf, size, count, fp)
516 #endif
519 HAVE_MEMCPY should be defined if you are not otherwise using
520 ANSI STD C, but still have memcpy and memset in your C library
521 and want to use them in calloc and realloc. Otherwise simple
522 macro versions are defined below.
524 USE_MEMCPY should be defined as 1 if you actually want to
525 have memset and memcpy called. People report that the macro
526 versions are faster than libc versions on some systems.
528 Even if USE_MEMCPY is set to 1, loops to copy/clear small chunks
529 (of <= 36 bytes) are manually unrolled in realloc and calloc.
532 #define HAVE_MEMCPY
534 #ifndef USE_MEMCPY
535 #ifdef HAVE_MEMCPY
536 #define USE_MEMCPY 1
537 #else
538 #define USE_MEMCPY 0
539 #endif
540 #endif
543 #if (__STD_C || defined(HAVE_MEMCPY))
545 #ifdef _LIBC
546 # include <string.h>
547 #else
548 #ifdef WIN32
549 /* On Win32 memset and memcpy are already declared in windows.h */
550 #else
551 #if __STD_C
552 void* memset(void*, int, size_t);
553 void* memcpy(void*, const void*, size_t);
554 #else
555 Void_t* memset();
556 Void_t* memcpy();
557 #endif
558 #endif
559 #endif
560 #endif
563 MALLOC_FAILURE_ACTION is the action to take before "return 0" when
564 malloc fails to be able to return memory, either because memory is
565 exhausted or because of illegal arguments.
567 By default, sets errno if running on STD_C platform, else does nothing.
570 #ifndef MALLOC_FAILURE_ACTION
571 #if __STD_C
572 #define MALLOC_FAILURE_ACTION \
573 errno = ENOMEM;
575 #else
576 #define MALLOC_FAILURE_ACTION
577 #endif
578 #endif
581 MORECORE-related declarations. By default, rely on sbrk
585 #ifdef LACKS_UNISTD_H
586 #if !defined(__FreeBSD__) && !defined(__OpenBSD__) && !defined(__NetBSD__)
587 #if __STD_C
588 extern Void_t* sbrk(ptrdiff_t);
589 #else
590 extern Void_t* sbrk();
591 #endif
592 #endif
593 #endif
596 MORECORE is the name of the routine to call to obtain more memory
597 from the system. See below for general guidance on writing
598 alternative MORECORE functions, as well as a version for WIN32 and a
599 sample version for pre-OSX macos.
602 #ifndef MORECORE
603 #define MORECORE sbrk
604 #endif
607 MORECORE_FAILURE is the value returned upon failure of MORECORE
608 as well as mmap. Since it cannot be an otherwise valid memory address,
609 and must reflect values of standard sys calls, you probably ought not
610 try to redefine it.
613 #ifndef MORECORE_FAILURE
614 #define MORECORE_FAILURE (-1)
615 #endif
618 If MORECORE_CONTIGUOUS is true, take advantage of fact that
619 consecutive calls to MORECORE with positive arguments always return
620 contiguous increasing addresses. This is true of unix sbrk. Even
621 if not defined, when regions happen to be contiguous, malloc will
622 permit allocations spanning regions obtained from different
623 calls. But defining this when applicable enables some stronger
624 consistency checks and space efficiencies.
627 #ifndef MORECORE_CONTIGUOUS
628 #define MORECORE_CONTIGUOUS 1
629 #endif
632 Define MORECORE_CANNOT_TRIM if your version of MORECORE
633 cannot release space back to the system when given negative
634 arguments. This is generally necessary only if you are using
635 a hand-crafted MORECORE function that cannot handle negative arguments.
638 /* #define MORECORE_CANNOT_TRIM */
640 /* MORECORE_CLEARS (default 1)
641 The degree to which the routine mapped to MORECORE zeroes out
642 memory: never (0), only for newly allocated space (1) or always
643 (2). The distinction between (1) and (2) is necessary because on
644 some systems, if the application first decrements and then
645 increments the break value, the contents of the reallocated space
646 are unspecified.
649 #ifndef MORECORE_CLEARS
650 #define MORECORE_CLEARS 1
651 #endif
655 Define HAVE_MMAP as true to optionally make malloc() use mmap() to
656 allocate very large blocks. These will be returned to the
657 operating system immediately after a free(). Also, if mmap
658 is available, it is used as a backup strategy in cases where
659 MORECORE fails to provide space from system.
661 This malloc is best tuned to work with mmap for large requests.
662 If you do not have mmap, operations involving very large chunks (1MB
663 or so) may be slower than you'd like.
666 #ifndef HAVE_MMAP
667 #define HAVE_MMAP 1
670 Standard unix mmap using /dev/zero clears memory so calloc doesn't
671 need to.
674 #ifndef MMAP_CLEARS
675 #define MMAP_CLEARS 1
676 #endif
678 #else /* no mmap */
679 #ifndef MMAP_CLEARS
680 #define MMAP_CLEARS 0
681 #endif
682 #endif
686 MMAP_AS_MORECORE_SIZE is the minimum mmap size argument to use if
687 sbrk fails, and mmap is used as a backup (which is done only if
688 HAVE_MMAP). The value must be a multiple of page size. This
689 backup strategy generally applies only when systems have "holes" in
690 address space, so sbrk cannot perform contiguous expansion, but
691 there is still space available on system. On systems for which
692 this is known to be useful (i.e. most linux kernels), this occurs
693 only when programs allocate huge amounts of memory. Between this,
694 and the fact that mmap regions tend to be limited, the size should
695 be large, to avoid too many mmap calls and thus avoid running out
696 of kernel resources.
699 #ifndef MMAP_AS_MORECORE_SIZE
700 #define MMAP_AS_MORECORE_SIZE (1024 * 1024)
701 #endif
704 Define HAVE_MREMAP to make realloc() use mremap() to re-allocate
705 large blocks. This is currently only possible on Linux with
706 kernel versions newer than 1.3.77.
709 #ifndef HAVE_MREMAP
710 #ifdef linux
711 #define HAVE_MREMAP 1
712 #else
713 #define HAVE_MREMAP 0
714 #endif
716 #endif /* HAVE_MMAP */
718 /* Define USE_ARENAS to enable support for multiple `arenas'. These
719 are allocated using mmap(), are necessary for threads and
720 occasionally useful to overcome address space limitations affecting
721 sbrk(). */
723 #ifndef USE_ARENAS
724 #define USE_ARENAS HAVE_MMAP
725 #endif
729 The system page size. To the extent possible, this malloc manages
730 memory from the system in page-size units. Note that this value is
731 cached during initialization into a field of malloc_state. So even
732 if malloc_getpagesize is a function, it is only called once.
734 The following mechanics for getpagesize were adapted from bsd/gnu
735 getpagesize.h. If none of the system-probes here apply, a value of
736 4096 is used, which should be OK: If they don't apply, then using
737 the actual value probably doesn't impact performance.
741 #ifndef malloc_getpagesize
743 #ifndef LACKS_UNISTD_H
744 # include <unistd.h>
745 #endif
747 # ifdef _SC_PAGESIZE /* some SVR4 systems omit an underscore */
748 # ifndef _SC_PAGE_SIZE
749 # define _SC_PAGE_SIZE _SC_PAGESIZE
750 # endif
751 # endif
753 # ifdef _SC_PAGE_SIZE
754 # define malloc_getpagesize sysconf(_SC_PAGE_SIZE)
755 # else
756 # if defined(BSD) || defined(DGUX) || defined(HAVE_GETPAGESIZE)
757 extern size_t getpagesize();
758 # define malloc_getpagesize getpagesize()
759 # else
760 # ifdef WIN32 /* use supplied emulation of getpagesize */
761 # define malloc_getpagesize getpagesize()
762 # else
763 # ifndef LACKS_SYS_PARAM_H
764 # include <sys/param.h>
765 # endif
766 # ifdef EXEC_PAGESIZE
767 # define malloc_getpagesize EXEC_PAGESIZE
768 # else
769 # ifdef NBPG
770 # ifndef CLSIZE
771 # define malloc_getpagesize NBPG
772 # else
773 # define malloc_getpagesize (NBPG * CLSIZE)
774 # endif
775 # else
776 # ifdef NBPC
777 # define malloc_getpagesize NBPC
778 # else
779 # ifdef PAGESIZE
780 # define malloc_getpagesize PAGESIZE
781 # else /* just guess */
782 # define malloc_getpagesize (4096)
783 # endif
784 # endif
785 # endif
786 # endif
787 # endif
788 # endif
789 # endif
790 #endif
793 This version of malloc supports the standard SVID/XPG mallinfo
794 routine that returns a struct containing usage properties and
795 statistics. It should work on any SVID/XPG compliant system that has
796 a /usr/include/malloc.h defining struct mallinfo. (If you'd like to
797 install such a thing yourself, cut out the preliminary declarations
798 as described above and below and save them in a malloc.h file. But
799 there's no compelling reason to bother to do this.)
801 The main declaration needed is the mallinfo struct that is returned
802 (by-copy) by mallinfo(). The SVID/XPG malloinfo struct contains a
803 bunch of fields that are not even meaningful in this version of
804 malloc. These fields are are instead filled by mallinfo() with
805 other numbers that might be of interest.
807 HAVE_USR_INCLUDE_MALLOC_H should be set if you have a
808 /usr/include/malloc.h file that includes a declaration of struct
809 mallinfo. If so, it is included; else an SVID2/XPG2 compliant
810 version is declared below. These must be precisely the same for
811 mallinfo() to work. The original SVID version of this struct,
812 defined on most systems with mallinfo, declares all fields as
813 ints. But some others define as unsigned long. If your system
814 defines the fields using a type of different width than listed here,
815 you must #include your system version and #define
816 HAVE_USR_INCLUDE_MALLOC_H.
819 /* #define HAVE_USR_INCLUDE_MALLOC_H */
821 #ifdef HAVE_USR_INCLUDE_MALLOC_H
822 #include "/usr/include/malloc.h"
823 #endif
826 /* ---------- description of public routines ------------ */
829 malloc(size_t n)
830 Returns a pointer to a newly allocated chunk of at least n bytes, or null
831 if no space is available. Additionally, on failure, errno is
832 set to ENOMEM on ANSI C systems.
834 If n is zero, malloc returns a minumum-sized chunk. (The minimum
835 size is 16 bytes on most 32bit systems, and 24 or 32 bytes on 64bit
836 systems.) On most systems, size_t is an unsigned type, so calls
837 with negative arguments are interpreted as requests for huge amounts
838 of space, which will often fail. The maximum supported value of n
839 differs across systems, but is in all cases less than the maximum
840 representable value of a size_t.
842 #if __STD_C
843 Void_t* public_mALLOc(size_t);
844 #else
845 Void_t* public_mALLOc();
846 #endif
847 #ifdef libc_hidden_proto
848 libc_hidden_proto (public_mALLOc)
849 #endif
852 free(Void_t* p)
853 Releases the chunk of memory pointed to by p, that had been previously
854 allocated using malloc or a related routine such as realloc.
855 It has no effect if p is null. It can have arbitrary (i.e., bad!)
856 effects if p has already been freed.
858 Unless disabled (using mallopt), freeing very large spaces will
859 when possible, automatically trigger operations that give
860 back unused memory to the system, thus reducing program footprint.
862 #if __STD_C
863 void public_fREe(Void_t*);
864 #else
865 void public_fREe();
866 #endif
867 #ifdef libc_hidden_proto
868 libc_hidden_proto (public_fREe)
869 #endif
872 calloc(size_t n_elements, size_t element_size);
873 Returns a pointer to n_elements * element_size bytes, with all locations
874 set to zero.
876 #if __STD_C
877 Void_t* public_cALLOc(size_t, size_t);
878 #else
879 Void_t* public_cALLOc();
880 #endif
883 realloc(Void_t* p, size_t n)
884 Returns a pointer to a chunk of size n that contains the same data
885 as does chunk p up to the minimum of (n, p's size) bytes, or null
886 if no space is available.
888 The returned pointer may or may not be the same as p. The algorithm
889 prefers extending p when possible, otherwise it employs the
890 equivalent of a malloc-copy-free sequence.
892 If p is null, realloc is equivalent to malloc.
894 If space is not available, realloc returns null, errno is set (if on
895 ANSI) and p is NOT freed.
897 if n is for fewer bytes than already held by p, the newly unused
898 space is lopped off and freed if possible. Unless the #define
899 REALLOC_ZERO_BYTES_FREES is set, realloc with a size argument of
900 zero (re)allocates a minimum-sized chunk.
902 Large chunks that were internally obtained via mmap will always
903 be reallocated using malloc-copy-free sequences unless
904 the system supports MREMAP (currently only linux).
906 The old unix realloc convention of allowing the last-free'd chunk
907 to be used as an argument to realloc is not supported.
909 #if __STD_C
910 Void_t* public_rEALLOc(Void_t*, size_t);
911 #else
912 Void_t* public_rEALLOc();
913 #endif
914 #ifdef libc_hidden_proto
915 libc_hidden_proto (public_rEALLOc)
916 #endif
919 memalign(size_t alignment, size_t n);
920 Returns a pointer to a newly allocated chunk of n bytes, aligned
921 in accord with the alignment argument.
923 The alignment argument should be a power of two. If the argument is
924 not a power of two, the nearest greater power is used.
925 8-byte alignment is guaranteed by normal malloc calls, so don't
926 bother calling memalign with an argument of 8 or less.
928 Overreliance on memalign is a sure way to fragment space.
930 #if __STD_C
931 Void_t* public_mEMALIGn(size_t, size_t);
932 #else
933 Void_t* public_mEMALIGn();
934 #endif
935 #ifdef libc_hidden_proto
936 libc_hidden_proto (public_mEMALIGn)
937 #endif
940 valloc(size_t n);
941 Equivalent to memalign(pagesize, n), where pagesize is the page
942 size of the system. If the pagesize is unknown, 4096 is used.
944 #if __STD_C
945 Void_t* public_vALLOc(size_t);
946 #else
947 Void_t* public_vALLOc();
948 #endif
953 mallopt(int parameter_number, int parameter_value)
954 Sets tunable parameters The format is to provide a
955 (parameter-number, parameter-value) pair. mallopt then sets the
956 corresponding parameter to the argument value if it can (i.e., so
957 long as the value is meaningful), and returns 1 if successful else
958 0. SVID/XPG/ANSI defines four standard param numbers for mallopt,
959 normally defined in malloc.h. Only one of these (M_MXFAST) is used
960 in this malloc. The others (M_NLBLKS, M_GRAIN, M_KEEP) don't apply,
961 so setting them has no effect. But this malloc also supports four
962 other options in mallopt. See below for details. Briefly, supported
963 parameters are as follows (listed defaults are for "typical"
964 configurations).
966 Symbol param # default allowed param values
967 M_MXFAST 1 64 0-80 (0 disables fastbins)
968 M_TRIM_THRESHOLD -1 128*1024 any (-1U disables trimming)
969 M_TOP_PAD -2 0 any
970 M_MMAP_THRESHOLD -3 128*1024 any (or 0 if no MMAP support)
971 M_MMAP_MAX -4 65536 any (0 disables use of mmap)
973 #if __STD_C
974 int public_mALLOPt(int, int);
975 #else
976 int public_mALLOPt();
977 #endif
981 mallinfo()
982 Returns (by copy) a struct containing various summary statistics:
984 arena: current total non-mmapped bytes allocated from system
985 ordblks: the number of free chunks
986 smblks: the number of fastbin blocks (i.e., small chunks that
987 have been freed but not use resused or consolidated)
988 hblks: current number of mmapped regions
989 hblkhd: total bytes held in mmapped regions
990 usmblks: the maximum total allocated space. This will be greater
991 than current total if trimming has occurred.
992 fsmblks: total bytes held in fastbin blocks
993 uordblks: current total allocated space (normal or mmapped)
994 fordblks: total free space
995 keepcost: the maximum number of bytes that could ideally be released
996 back to system via malloc_trim. ("ideally" means that
997 it ignores page restrictions etc.)
999 Because these fields are ints, but internal bookkeeping may
1000 be kept as longs, the reported values may wrap around zero and
1001 thus be inaccurate.
1003 #if __STD_C
1004 struct mallinfo public_mALLINFo(void);
1005 #else
1006 struct mallinfo public_mALLINFo();
1007 #endif
1010 independent_calloc(size_t n_elements, size_t element_size, Void_t* chunks[]);
1012 independent_calloc is similar to calloc, but instead of returning a
1013 single cleared space, it returns an array of pointers to n_elements
1014 independent elements that can hold contents of size elem_size, each
1015 of which starts out cleared, and can be independently freed,
1016 realloc'ed etc. The elements are guaranteed to be adjacently
1017 allocated (this is not guaranteed to occur with multiple callocs or
1018 mallocs), which may also improve cache locality in some
1019 applications.
1021 The "chunks" argument is optional (i.e., may be null, which is
1022 probably the most typical usage). If it is null, the returned array
1023 is itself dynamically allocated and should also be freed when it is
1024 no longer needed. Otherwise, the chunks array must be of at least
1025 n_elements in length. It is filled in with the pointers to the
1026 chunks.
1028 In either case, independent_calloc returns this pointer array, or
1029 null if the allocation failed. If n_elements is zero and "chunks"
1030 is null, it returns a chunk representing an array with zero elements
1031 (which should be freed if not wanted).
1033 Each element must be individually freed when it is no longer
1034 needed. If you'd like to instead be able to free all at once, you
1035 should instead use regular calloc and assign pointers into this
1036 space to represent elements. (In this case though, you cannot
1037 independently free elements.)
1039 independent_calloc simplifies and speeds up implementations of many
1040 kinds of pools. It may also be useful when constructing large data
1041 structures that initially have a fixed number of fixed-sized nodes,
1042 but the number is not known at compile time, and some of the nodes
1043 may later need to be freed. For example:
1045 struct Node { int item; struct Node* next; };
1047 struct Node* build_list() {
1048 struct Node** pool;
1049 int n = read_number_of_nodes_needed();
1050 if (n <= 0) return 0;
1051 pool = (struct Node**)(independent_calloc(n, sizeof(struct Node), 0);
1052 if (pool == 0) die();
1053 // organize into a linked list...
1054 struct Node* first = pool[0];
1055 for (i = 0; i < n-1; ++i)
1056 pool[i]->next = pool[i+1];
1057 free(pool); // Can now free the array (or not, if it is needed later)
1058 return first;
1061 #if __STD_C
1062 Void_t** public_iCALLOc(size_t, size_t, Void_t**);
1063 #else
1064 Void_t** public_iCALLOc();
1065 #endif
1068 independent_comalloc(size_t n_elements, size_t sizes[], Void_t* chunks[]);
1070 independent_comalloc allocates, all at once, a set of n_elements
1071 chunks with sizes indicated in the "sizes" array. It returns
1072 an array of pointers to these elements, each of which can be
1073 independently freed, realloc'ed etc. The elements are guaranteed to
1074 be adjacently allocated (this is not guaranteed to occur with
1075 multiple callocs or mallocs), which may also improve cache locality
1076 in some applications.
1078 The "chunks" argument is optional (i.e., may be null). If it is null
1079 the returned array is itself dynamically allocated and should also
1080 be freed when it is no longer needed. Otherwise, the chunks array
1081 must be of at least n_elements in length. It is filled in with the
1082 pointers to the chunks.
1084 In either case, independent_comalloc returns this pointer array, or
1085 null if the allocation failed. If n_elements is zero and chunks is
1086 null, it returns a chunk representing an array with zero elements
1087 (which should be freed if not wanted).
1089 Each element must be individually freed when it is no longer
1090 needed. If you'd like to instead be able to free all at once, you
1091 should instead use a single regular malloc, and assign pointers at
1092 particular offsets in the aggregate space. (In this case though, you
1093 cannot independently free elements.)
1095 independent_comallac differs from independent_calloc in that each
1096 element may have a different size, and also that it does not
1097 automatically clear elements.
1099 independent_comalloc can be used to speed up allocation in cases
1100 where several structs or objects must always be allocated at the
1101 same time. For example:
1103 struct Head { ... }
1104 struct Foot { ... }
1106 void send_message(char* msg) {
1107 int msglen = strlen(msg);
1108 size_t sizes[3] = { sizeof(struct Head), msglen, sizeof(struct Foot) };
1109 void* chunks[3];
1110 if (independent_comalloc(3, sizes, chunks) == 0)
1111 die();
1112 struct Head* head = (struct Head*)(chunks[0]);
1113 char* body = (char*)(chunks[1]);
1114 struct Foot* foot = (struct Foot*)(chunks[2]);
1115 // ...
1118 In general though, independent_comalloc is worth using only for
1119 larger values of n_elements. For small values, you probably won't
1120 detect enough difference from series of malloc calls to bother.
1122 Overuse of independent_comalloc can increase overall memory usage,
1123 since it cannot reuse existing noncontiguous small chunks that
1124 might be available for some of the elements.
1126 #if __STD_C
1127 Void_t** public_iCOMALLOc(size_t, size_t*, Void_t**);
1128 #else
1129 Void_t** public_iCOMALLOc();
1130 #endif
1134 pvalloc(size_t n);
1135 Equivalent to valloc(minimum-page-that-holds(n)), that is,
1136 round up n to nearest pagesize.
1138 #if __STD_C
1139 Void_t* public_pVALLOc(size_t);
1140 #else
1141 Void_t* public_pVALLOc();
1142 #endif
1145 cfree(Void_t* p);
1146 Equivalent to free(p).
1148 cfree is needed/defined on some systems that pair it with calloc,
1149 for odd historical reasons (such as: cfree is used in example
1150 code in the first edition of K&R).
1152 #if __STD_C
1153 void public_cFREe(Void_t*);
1154 #else
1155 void public_cFREe();
1156 #endif
1159 malloc_trim(size_t pad);
1161 If possible, gives memory back to the system (via negative
1162 arguments to sbrk) if there is unused memory at the `high' end of
1163 the malloc pool. You can call this after freeing large blocks of
1164 memory to potentially reduce the system-level memory requirements
1165 of a program. However, it cannot guarantee to reduce memory. Under
1166 some allocation patterns, some large free blocks of memory will be
1167 locked between two used chunks, so they cannot be given back to
1168 the system.
1170 The `pad' argument to malloc_trim represents the amount of free
1171 trailing space to leave untrimmed. If this argument is zero,
1172 only the minimum amount of memory to maintain internal data
1173 structures will be left (one page or less). Non-zero arguments
1174 can be supplied to maintain enough trailing space to service
1175 future expected allocations without having to re-obtain memory
1176 from the system.
1178 Malloc_trim returns 1 if it actually released any memory, else 0.
1179 On systems that do not support "negative sbrks", it will always
1180 rreturn 0.
1182 #if __STD_C
1183 int public_mTRIm(size_t);
1184 #else
1185 int public_mTRIm();
1186 #endif
1189 malloc_usable_size(Void_t* p);
1191 Returns the number of bytes you can actually use in
1192 an allocated chunk, which may be more than you requested (although
1193 often not) due to alignment and minimum size constraints.
1194 You can use this many bytes without worrying about
1195 overwriting other allocated objects. This is not a particularly great
1196 programming practice. malloc_usable_size can be more useful in
1197 debugging and assertions, for example:
1199 p = malloc(n);
1200 assert(malloc_usable_size(p) >= 256);
1203 #if __STD_C
1204 size_t public_mUSABLe(Void_t*);
1205 #else
1206 size_t public_mUSABLe();
1207 #endif
1210 malloc_stats();
1211 Prints on stderr the amount of space obtained from the system (both
1212 via sbrk and mmap), the maximum amount (which may be more than
1213 current if malloc_trim and/or munmap got called), and the current
1214 number of bytes allocated via malloc (or realloc, etc) but not yet
1215 freed. Note that this is the number of bytes allocated, not the
1216 number requested. It will be larger than the number requested
1217 because of alignment and bookkeeping overhead. Because it includes
1218 alignment wastage as being in use, this figure may be greater than
1219 zero even when no user-level chunks are allocated.
1221 The reported current and maximum system memory can be inaccurate if
1222 a program makes other calls to system memory allocation functions
1223 (normally sbrk) outside of malloc.
1225 malloc_stats prints only the most commonly interesting statistics.
1226 More information can be obtained by calling mallinfo.
1229 #if __STD_C
1230 void public_mSTATs(void);
1231 #else
1232 void public_mSTATs();
1233 #endif
1236 malloc_get_state(void);
1238 Returns the state of all malloc variables in an opaque data
1239 structure.
1241 #if __STD_C
1242 Void_t* public_gET_STATe(void);
1243 #else
1244 Void_t* public_gET_STATe();
1245 #endif
1248 malloc_set_state(Void_t* state);
1250 Restore the state of all malloc variables from data obtained with
1251 malloc_get_state().
1253 #if __STD_C
1254 int public_sET_STATe(Void_t*);
1255 #else
1256 int public_sET_STATe();
1257 #endif
1259 #ifdef _LIBC
1261 posix_memalign(void **memptr, size_t alignment, size_t size);
1263 POSIX wrapper like memalign(), checking for validity of size.
1265 int __posix_memalign(void **, size_t, size_t);
1266 #endif
1268 /* mallopt tuning options */
1271 M_MXFAST is the maximum request size used for "fastbins", special bins
1272 that hold returned chunks without consolidating their spaces. This
1273 enables future requests for chunks of the same size to be handled
1274 very quickly, but can increase fragmentation, and thus increase the
1275 overall memory footprint of a program.
1277 This malloc manages fastbins very conservatively yet still
1278 efficiently, so fragmentation is rarely a problem for values less
1279 than or equal to the default. The maximum supported value of MXFAST
1280 is 80. You wouldn't want it any higher than this anyway. Fastbins
1281 are designed especially for use with many small structs, objects or
1282 strings -- the default handles structs/objects/arrays with sizes up
1283 to 8 4byte fields, or small strings representing words, tokens,
1284 etc. Using fastbins for larger objects normally worsens
1285 fragmentation without improving speed.
1287 M_MXFAST is set in REQUEST size units. It is internally used in
1288 chunksize units, which adds padding and alignment. You can reduce
1289 M_MXFAST to 0 to disable all use of fastbins. This causes the malloc
1290 algorithm to be a closer approximation of fifo-best-fit in all cases,
1291 not just for larger requests, but will generally cause it to be
1292 slower.
1296 /* M_MXFAST is a standard SVID/XPG tuning option, usually listed in malloc.h */
1297 #ifndef M_MXFAST
1298 #define M_MXFAST 1
1299 #endif
1301 #ifndef DEFAULT_MXFAST
1302 #define DEFAULT_MXFAST 64
1303 #endif
1307 M_TRIM_THRESHOLD is the maximum amount of unused top-most memory
1308 to keep before releasing via malloc_trim in free().
1310 Automatic trimming is mainly useful in long-lived programs.
1311 Because trimming via sbrk can be slow on some systems, and can
1312 sometimes be wasteful (in cases where programs immediately
1313 afterward allocate more large chunks) the value should be high
1314 enough so that your overall system performance would improve by
1315 releasing this much memory.
1317 The trim threshold and the mmap control parameters (see below)
1318 can be traded off with one another. Trimming and mmapping are
1319 two different ways of releasing unused memory back to the
1320 system. Between these two, it is often possible to keep
1321 system-level demands of a long-lived program down to a bare
1322 minimum. For example, in one test suite of sessions measuring
1323 the XF86 X server on Linux, using a trim threshold of 128K and a
1324 mmap threshold of 192K led to near-minimal long term resource
1325 consumption.
1327 If you are using this malloc in a long-lived program, it should
1328 pay to experiment with these values. As a rough guide, you
1329 might set to a value close to the average size of a process
1330 (program) running on your system. Releasing this much memory
1331 would allow such a process to run in memory. Generally, it's
1332 worth it to tune for trimming rather tham memory mapping when a
1333 program undergoes phases where several large chunks are
1334 allocated and released in ways that can reuse each other's
1335 storage, perhaps mixed with phases where there are no such
1336 chunks at all. And in well-behaved long-lived programs,
1337 controlling release of large blocks via trimming versus mapping
1338 is usually faster.
1340 However, in most programs, these parameters serve mainly as
1341 protection against the system-level effects of carrying around
1342 massive amounts of unneeded memory. Since frequent calls to
1343 sbrk, mmap, and munmap otherwise degrade performance, the default
1344 parameters are set to relatively high values that serve only as
1345 safeguards.
1347 The trim value It must be greater than page size to have any useful
1348 effect. To disable trimming completely, you can set to
1349 (unsigned long)(-1)
1351 Trim settings interact with fastbin (MXFAST) settings: Unless
1352 TRIM_FASTBINS is defined, automatic trimming never takes place upon
1353 freeing a chunk with size less than or equal to MXFAST. Trimming is
1354 instead delayed until subsequent freeing of larger chunks. However,
1355 you can still force an attempted trim by calling malloc_trim.
1357 Also, trimming is not generally possible in cases where
1358 the main arena is obtained via mmap.
1360 Note that the trick some people use of mallocing a huge space and
1361 then freeing it at program startup, in an attempt to reserve system
1362 memory, doesn't have the intended effect under automatic trimming,
1363 since that memory will immediately be returned to the system.
1366 #define M_TRIM_THRESHOLD -1
1368 #ifndef DEFAULT_TRIM_THRESHOLD
1369 #define DEFAULT_TRIM_THRESHOLD (128 * 1024)
1370 #endif
1373 M_TOP_PAD is the amount of extra `padding' space to allocate or
1374 retain whenever sbrk is called. It is used in two ways internally:
1376 * When sbrk is called to extend the top of the arena to satisfy
1377 a new malloc request, this much padding is added to the sbrk
1378 request.
1380 * When malloc_trim is called automatically from free(),
1381 it is used as the `pad' argument.
1383 In both cases, the actual amount of padding is rounded
1384 so that the end of the arena is always a system page boundary.
1386 The main reason for using padding is to avoid calling sbrk so
1387 often. Having even a small pad greatly reduces the likelihood
1388 that nearly every malloc request during program start-up (or
1389 after trimming) will invoke sbrk, which needlessly wastes
1390 time.
1392 Automatic rounding-up to page-size units is normally sufficient
1393 to avoid measurable overhead, so the default is 0. However, in
1394 systems where sbrk is relatively slow, it can pay to increase
1395 this value, at the expense of carrying around more memory than
1396 the program needs.
1399 #define M_TOP_PAD -2
1401 #ifndef DEFAULT_TOP_PAD
1402 #define DEFAULT_TOP_PAD (0)
1403 #endif
1406 M_MMAP_THRESHOLD is the request size threshold for using mmap()
1407 to service a request. Requests of at least this size that cannot
1408 be allocated using already-existing space will be serviced via mmap.
1409 (If enough normal freed space already exists it is used instead.)
1411 Using mmap segregates relatively large chunks of memory so that
1412 they can be individually obtained and released from the host
1413 system. A request serviced through mmap is never reused by any
1414 other request (at least not directly; the system may just so
1415 happen to remap successive requests to the same locations).
1417 Segregating space in this way has the benefits that:
1419 1. Mmapped space can ALWAYS be individually released back
1420 to the system, which helps keep the system level memory
1421 demands of a long-lived program low.
1422 2. Mapped memory can never become `locked' between
1423 other chunks, as can happen with normally allocated chunks, which
1424 means that even trimming via malloc_trim would not release them.
1425 3. On some systems with "holes" in address spaces, mmap can obtain
1426 memory that sbrk cannot.
1428 However, it has the disadvantages that:
1430 1. The space cannot be reclaimed, consolidated, and then
1431 used to service later requests, as happens with normal chunks.
1432 2. It can lead to more wastage because of mmap page alignment
1433 requirements
1434 3. It causes malloc performance to be more dependent on host
1435 system memory management support routines which may vary in
1436 implementation quality and may impose arbitrary
1437 limitations. Generally, servicing a request via normal
1438 malloc steps is faster than going through a system's mmap.
1440 The advantages of mmap nearly always outweigh disadvantages for
1441 "large" chunks, but the value of "large" varies across systems. The
1442 default is an empirically derived value that works well in most
1443 systems.
1446 #define M_MMAP_THRESHOLD -3
1448 #ifndef DEFAULT_MMAP_THRESHOLD
1449 #define DEFAULT_MMAP_THRESHOLD (128 * 1024)
1450 #endif
1453 M_MMAP_MAX is the maximum number of requests to simultaneously
1454 service using mmap. This parameter exists because
1455 some systems have a limited number of internal tables for
1456 use by mmap, and using more than a few of them may degrade
1457 performance.
1459 The default is set to a value that serves only as a safeguard.
1460 Setting to 0 disables use of mmap for servicing large requests. If
1461 HAVE_MMAP is not set, the default value is 0, and attempts to set it
1462 to non-zero values in mallopt will fail.
1465 #define M_MMAP_MAX -4
1467 #ifndef DEFAULT_MMAP_MAX
1468 #if HAVE_MMAP
1469 #define DEFAULT_MMAP_MAX (65536)
1470 #else
1471 #define DEFAULT_MMAP_MAX (0)
1472 #endif
1473 #endif
1475 #ifdef __cplusplus
1476 } /* end of extern "C" */
1477 #endif
1479 #include <malloc.h>
1481 #ifndef BOUNDED_N
1482 #define BOUNDED_N(ptr, sz) (ptr)
1483 #endif
1484 #ifndef RETURN_ADDRESS
1485 #define RETURN_ADDRESS(X_) (NULL)
1486 #endif
1488 /* On some platforms we can compile internal, not exported functions better.
1489 Let the environment provide a macro and define it to be empty if it
1490 is not available. */
1491 #ifndef internal_function
1492 # define internal_function
1493 #endif
1495 /* Forward declarations. */
1496 struct malloc_chunk;
1497 typedef struct malloc_chunk* mchunkptr;
1499 /* Internal routines. */
1501 #if __STD_C
1503 Void_t* _int_malloc(mstate, size_t);
1504 void _int_free(mstate, Void_t*);
1505 Void_t* _int_realloc(mstate, Void_t*, size_t);
1506 Void_t* _int_memalign(mstate, size_t, size_t);
1507 Void_t* _int_valloc(mstate, size_t);
1508 static Void_t* _int_pvalloc(mstate, size_t);
1509 /*static Void_t* cALLOc(size_t, size_t);*/
1510 static Void_t** _int_icalloc(mstate, size_t, size_t, Void_t**);
1511 static Void_t** _int_icomalloc(mstate, size_t, size_t*, Void_t**);
1512 static int mTRIm(size_t);
1513 static size_t mUSABLe(Void_t*);
1514 static void mSTATs(void);
1515 static int mALLOPt(int, int);
1516 static struct mallinfo mALLINFo(mstate);
1517 static void malloc_printerr(int action, const char *str, void *ptr);
1519 static Void_t* internal_function mem2mem_check(Void_t *p, size_t sz);
1520 static int internal_function top_check(void);
1521 static void internal_function munmap_chunk(mchunkptr p);
1522 #if HAVE_MREMAP
1523 static mchunkptr internal_function mremap_chunk(mchunkptr p, size_t new_size);
1524 #endif
1526 static Void_t* malloc_check(size_t sz, const Void_t *caller);
1527 static void free_check(Void_t* mem, const Void_t *caller);
1528 static Void_t* realloc_check(Void_t* oldmem, size_t bytes,
1529 const Void_t *caller);
1530 static Void_t* memalign_check(size_t alignment, size_t bytes,
1531 const Void_t *caller);
1532 #ifndef NO_THREADS
1533 # ifdef _LIBC
1534 # if USE___THREAD || (defined USE_TLS && !defined SHARED)
1535 /* These routines are never needed in this configuration. */
1536 # define NO_STARTER
1537 # endif
1538 # endif
1539 # ifdef NO_STARTER
1540 # undef NO_STARTER
1541 # else
1542 static Void_t* malloc_starter(size_t sz, const Void_t *caller);
1543 static Void_t* memalign_starter(size_t aln, size_t sz, const Void_t *caller);
1544 static void free_starter(Void_t* mem, const Void_t *caller);
1545 # endif
1546 static Void_t* malloc_atfork(size_t sz, const Void_t *caller);
1547 static void free_atfork(Void_t* mem, const Void_t *caller);
1548 #endif
1550 #else
1552 Void_t* _int_malloc();
1553 void _int_free();
1554 Void_t* _int_realloc();
1555 Void_t* _int_memalign();
1556 Void_t* _int_valloc();
1557 Void_t* _int_pvalloc();
1558 /*static Void_t* cALLOc();*/
1559 static Void_t** _int_icalloc();
1560 static Void_t** _int_icomalloc();
1561 static int mTRIm();
1562 static size_t mUSABLe();
1563 static void mSTATs();
1564 static int mALLOPt();
1565 static struct mallinfo mALLINFo();
1567 #endif
1572 /* ------------- Optional versions of memcopy ---------------- */
1575 #if USE_MEMCPY
1578 Note: memcpy is ONLY invoked with non-overlapping regions,
1579 so the (usually slower) memmove is not needed.
1582 #define MALLOC_COPY(dest, src, nbytes) memcpy(dest, src, nbytes)
1583 #define MALLOC_ZERO(dest, nbytes) memset(dest, 0, nbytes)
1585 #else /* !USE_MEMCPY */
1587 /* Use Duff's device for good zeroing/copying performance. */
1589 #define MALLOC_ZERO(charp, nbytes) \
1590 do { \
1591 INTERNAL_SIZE_T* mzp = (INTERNAL_SIZE_T*)(charp); \
1592 unsigned long mctmp = (nbytes)/sizeof(INTERNAL_SIZE_T); \
1593 long mcn; \
1594 if (mctmp < 8) mcn = 0; else { mcn = (mctmp-1)/8; mctmp %= 8; } \
1595 switch (mctmp) { \
1596 case 0: for(;;) { *mzp++ = 0; \
1597 case 7: *mzp++ = 0; \
1598 case 6: *mzp++ = 0; \
1599 case 5: *mzp++ = 0; \
1600 case 4: *mzp++ = 0; \
1601 case 3: *mzp++ = 0; \
1602 case 2: *mzp++ = 0; \
1603 case 1: *mzp++ = 0; if(mcn <= 0) break; mcn--; } \
1605 } while(0)
1607 #define MALLOC_COPY(dest,src,nbytes) \
1608 do { \
1609 INTERNAL_SIZE_T* mcsrc = (INTERNAL_SIZE_T*) src; \
1610 INTERNAL_SIZE_T* mcdst = (INTERNAL_SIZE_T*) dest; \
1611 unsigned long mctmp = (nbytes)/sizeof(INTERNAL_SIZE_T); \
1612 long mcn; \
1613 if (mctmp < 8) mcn = 0; else { mcn = (mctmp-1)/8; mctmp %= 8; } \
1614 switch (mctmp) { \
1615 case 0: for(;;) { *mcdst++ = *mcsrc++; \
1616 case 7: *mcdst++ = *mcsrc++; \
1617 case 6: *mcdst++ = *mcsrc++; \
1618 case 5: *mcdst++ = *mcsrc++; \
1619 case 4: *mcdst++ = *mcsrc++; \
1620 case 3: *mcdst++ = *mcsrc++; \
1621 case 2: *mcdst++ = *mcsrc++; \
1622 case 1: *mcdst++ = *mcsrc++; if(mcn <= 0) break; mcn--; } \
1624 } while(0)
1626 #endif
1628 /* ------------------ MMAP support ------------------ */
1631 #if HAVE_MMAP
1633 #include <fcntl.h>
1634 #ifndef LACKS_SYS_MMAN_H
1635 #include <sys/mman.h>
1636 #endif
1638 #if !defined(MAP_ANONYMOUS) && defined(MAP_ANON)
1639 # define MAP_ANONYMOUS MAP_ANON
1640 #endif
1641 #if !defined(MAP_FAILED)
1642 # define MAP_FAILED ((char*)-1)
1643 #endif
1645 #ifndef MAP_NORESERVE
1646 # ifdef MAP_AUTORESRV
1647 # define MAP_NORESERVE MAP_AUTORESRV
1648 # else
1649 # define MAP_NORESERVE 0
1650 # endif
1651 #endif
1654 Nearly all versions of mmap support MAP_ANONYMOUS,
1655 so the following is unlikely to be needed, but is
1656 supplied just in case.
1659 #ifndef MAP_ANONYMOUS
1661 static int dev_zero_fd = -1; /* Cached file descriptor for /dev/zero. */
1663 #define MMAP(addr, size, prot, flags) ((dev_zero_fd < 0) ? \
1664 (dev_zero_fd = open("/dev/zero", O_RDWR), \
1665 mmap((addr), (size), (prot), (flags), dev_zero_fd, 0)) : \
1666 mmap((addr), (size), (prot), (flags), dev_zero_fd, 0))
1668 #else
1670 #define MMAP(addr, size, prot, flags) \
1671 (mmap((addr), (size), (prot), (flags)|MAP_ANONYMOUS, -1, 0))
1673 #endif
1676 #endif /* HAVE_MMAP */
1680 ----------------------- Chunk representations -----------------------
1685 This struct declaration is misleading (but accurate and necessary).
1686 It declares a "view" into memory allowing access to necessary
1687 fields at known offsets from a given base. See explanation below.
1690 struct malloc_chunk {
1692 INTERNAL_SIZE_T prev_size; /* Size of previous chunk (if free). */
1693 INTERNAL_SIZE_T size; /* Size in bytes, including overhead. */
1695 struct malloc_chunk* fd; /* double links -- used only if free. */
1696 struct malloc_chunk* bk;
1701 malloc_chunk details:
1703 (The following includes lightly edited explanations by Colin Plumb.)
1705 Chunks of memory are maintained using a `boundary tag' method as
1706 described in e.g., Knuth or Standish. (See the paper by Paul
1707 Wilson ftp://ftp.cs.utexas.edu/pub/garbage/allocsrv.ps for a
1708 survey of such techniques.) Sizes of free chunks are stored both
1709 in the front of each chunk and at the end. This makes
1710 consolidating fragmented chunks into bigger chunks very fast. The
1711 size fields also hold bits representing whether chunks are free or
1712 in use.
1714 An allocated chunk looks like this:
1717 chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1718 | Size of previous chunk, if allocated | |
1719 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1720 | Size of chunk, in bytes |M|P|
1721 mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1722 | User data starts here... .
1724 . (malloc_usable_space() bytes) .
1726 nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1727 | Size of chunk |
1728 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1731 Where "chunk" is the front of the chunk for the purpose of most of
1732 the malloc code, but "mem" is the pointer that is returned to the
1733 user. "Nextchunk" is the beginning of the next contiguous chunk.
1735 Chunks always begin on even word boundries, so the mem portion
1736 (which is returned to the user) is also on an even word boundary, and
1737 thus at least double-word aligned.
1739 Free chunks are stored in circular doubly-linked lists, and look like this:
1741 chunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1742 | Size of previous chunk |
1743 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1744 `head:' | Size of chunk, in bytes |P|
1745 mem-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1746 | Forward pointer to next chunk in list |
1747 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1748 | Back pointer to previous chunk in list |
1749 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1750 | Unused space (may be 0 bytes long) .
1753 nextchunk-> +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1754 `foot:' | Size of chunk, in bytes |
1755 +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
1757 The P (PREV_INUSE) bit, stored in the unused low-order bit of the
1758 chunk size (which is always a multiple of two words), is an in-use
1759 bit for the *previous* chunk. If that bit is *clear*, then the
1760 word before the current chunk size contains the previous chunk
1761 size, and can be used to find the front of the previous chunk.
1762 The very first chunk allocated always has this bit set,
1763 preventing access to non-existent (or non-owned) memory. If
1764 prev_inuse is set for any given chunk, then you CANNOT determine
1765 the size of the previous chunk, and might even get a memory
1766 addressing fault when trying to do so.
1768 Note that the `foot' of the current chunk is actually represented
1769 as the prev_size of the NEXT chunk. This makes it easier to
1770 deal with alignments etc but can be very confusing when trying
1771 to extend or adapt this code.
1773 The two exceptions to all this are
1775 1. The special chunk `top' doesn't bother using the
1776 trailing size field since there is no next contiguous chunk
1777 that would have to index off it. After initialization, `top'
1778 is forced to always exist. If it would become less than
1779 MINSIZE bytes long, it is replenished.
1781 2. Chunks allocated via mmap, which have the second-lowest-order
1782 bit M (IS_MMAPPED) set in their size fields. Because they are
1783 allocated one-by-one, each must contain its own trailing size field.
1788 ---------- Size and alignment checks and conversions ----------
1791 /* conversion from malloc headers to user pointers, and back */
1793 #define chunk2mem(p) ((Void_t*)((char*)(p) + 2*SIZE_SZ))
1794 #define mem2chunk(mem) ((mchunkptr)((char*)(mem) - 2*SIZE_SZ))
1796 /* The smallest possible chunk */
1797 #define MIN_CHUNK_SIZE (sizeof(struct malloc_chunk))
1799 /* The smallest size we can malloc is an aligned minimal chunk */
1801 #define MINSIZE \
1802 (unsigned long)(((MIN_CHUNK_SIZE+MALLOC_ALIGN_MASK) & ~MALLOC_ALIGN_MASK))
1804 /* Check if m has acceptable alignment */
1806 #define aligned_OK(m) (((unsigned long)((m)) & (MALLOC_ALIGN_MASK)) == 0)
1810 Check if a request is so large that it would wrap around zero when
1811 padded and aligned. To simplify some other code, the bound is made
1812 low enough so that adding MINSIZE will also not wrap around zero.
1815 #define REQUEST_OUT_OF_RANGE(req) \
1816 ((unsigned long)(req) >= \
1817 (unsigned long)(INTERNAL_SIZE_T)(-2 * MINSIZE))
1819 /* pad request bytes into a usable size -- internal version */
1821 #define request2size(req) \
1822 (((req) + SIZE_SZ + MALLOC_ALIGN_MASK < MINSIZE) ? \
1823 MINSIZE : \
1824 ((req) + SIZE_SZ + MALLOC_ALIGN_MASK) & ~MALLOC_ALIGN_MASK)
1826 /* Same, except also perform argument check */
1828 #define checked_request2size(req, sz) \
1829 if (REQUEST_OUT_OF_RANGE(req)) { \
1830 MALLOC_FAILURE_ACTION; \
1831 return 0; \
1833 (sz) = request2size(req);
1836 --------------- Physical chunk operations ---------------
1840 /* size field is or'ed with PREV_INUSE when previous adjacent chunk in use */
1841 #define PREV_INUSE 0x1
1843 /* extract inuse bit of previous chunk */
1844 #define prev_inuse(p) ((p)->size & PREV_INUSE)
1847 /* size field is or'ed with IS_MMAPPED if the chunk was obtained with mmap() */
1848 #define IS_MMAPPED 0x2
1850 /* check for mmap()'ed chunk */
1851 #define chunk_is_mmapped(p) ((p)->size & IS_MMAPPED)
1854 /* size field is or'ed with NON_MAIN_ARENA if the chunk was obtained
1855 from a non-main arena. This is only set immediately before handing
1856 the chunk to the user, if necessary. */
1857 #define NON_MAIN_ARENA 0x4
1859 /* check for chunk from non-main arena */
1860 #define chunk_non_main_arena(p) ((p)->size & NON_MAIN_ARENA)
1864 Bits to mask off when extracting size
1866 Note: IS_MMAPPED is intentionally not masked off from size field in
1867 macros for which mmapped chunks should never be seen. This should
1868 cause helpful core dumps to occur if it is tried by accident by
1869 people extending or adapting this malloc.
1871 #define SIZE_BITS (PREV_INUSE|IS_MMAPPED|NON_MAIN_ARENA)
1873 /* Get size, ignoring use bits */
1874 #define chunksize(p) ((p)->size & ~(SIZE_BITS))
1877 /* Ptr to next physical malloc_chunk. */
1878 #define next_chunk(p) ((mchunkptr)( ((char*)(p)) + ((p)->size & ~SIZE_BITS) ))
1880 /* Ptr to previous physical malloc_chunk */
1881 #define prev_chunk(p) ((mchunkptr)( ((char*)(p)) - ((p)->prev_size) ))
1883 /* Treat space at ptr + offset as a chunk */
1884 #define chunk_at_offset(p, s) ((mchunkptr)(((char*)(p)) + (s)))
1886 /* extract p's inuse bit */
1887 #define inuse(p)\
1888 ((((mchunkptr)(((char*)(p))+((p)->size & ~SIZE_BITS)))->size) & PREV_INUSE)
1890 /* set/clear chunk as being inuse without otherwise disturbing */
1891 #define set_inuse(p)\
1892 ((mchunkptr)(((char*)(p)) + ((p)->size & ~SIZE_BITS)))->size |= PREV_INUSE
1894 #define clear_inuse(p)\
1895 ((mchunkptr)(((char*)(p)) + ((p)->size & ~SIZE_BITS)))->size &= ~(PREV_INUSE)
1898 /* check/set/clear inuse bits in known places */
1899 #define inuse_bit_at_offset(p, s)\
1900 (((mchunkptr)(((char*)(p)) + (s)))->size & PREV_INUSE)
1902 #define set_inuse_bit_at_offset(p, s)\
1903 (((mchunkptr)(((char*)(p)) + (s)))->size |= PREV_INUSE)
1905 #define clear_inuse_bit_at_offset(p, s)\
1906 (((mchunkptr)(((char*)(p)) + (s)))->size &= ~(PREV_INUSE))
1909 /* Set size at head, without disturbing its use bit */
1910 #define set_head_size(p, s) ((p)->size = (((p)->size & SIZE_BITS) | (s)))
1912 /* Set size/use field */
1913 #define set_head(p, s) ((p)->size = (s))
1915 /* Set size at footer (only when chunk is not in use) */
1916 #define set_foot(p, s) (((mchunkptr)((char*)(p) + (s)))->prev_size = (s))
1920 -------------------- Internal data structures --------------------
1922 All internal state is held in an instance of malloc_state defined
1923 below. There are no other static variables, except in two optional
1924 cases:
1925 * If USE_MALLOC_LOCK is defined, the mALLOC_MUTEx declared above.
1926 * If HAVE_MMAP is true, but mmap doesn't support
1927 MAP_ANONYMOUS, a dummy file descriptor for mmap.
1929 Beware of lots of tricks that minimize the total bookkeeping space
1930 requirements. The result is a little over 1K bytes (for 4byte
1931 pointers and size_t.)
1935 Bins
1937 An array of bin headers for free chunks. Each bin is doubly
1938 linked. The bins are approximately proportionally (log) spaced.
1939 There are a lot of these bins (128). This may look excessive, but
1940 works very well in practice. Most bins hold sizes that are
1941 unusual as malloc request sizes, but are more usual for fragments
1942 and consolidated sets of chunks, which is what these bins hold, so
1943 they can be found quickly. All procedures maintain the invariant
1944 that no consolidated chunk physically borders another one, so each
1945 chunk in a list is known to be preceeded and followed by either
1946 inuse chunks or the ends of memory.
1948 Chunks in bins are kept in size order, with ties going to the
1949 approximately least recently used chunk. Ordering isn't needed
1950 for the small bins, which all contain the same-sized chunks, but
1951 facilitates best-fit allocation for larger chunks. These lists
1952 are just sequential. Keeping them in order almost never requires
1953 enough traversal to warrant using fancier ordered data
1954 structures.
1956 Chunks of the same size are linked with the most
1957 recently freed at the front, and allocations are taken from the
1958 back. This results in LRU (FIFO) allocation order, which tends
1959 to give each chunk an equal opportunity to be consolidated with
1960 adjacent freed chunks, resulting in larger free chunks and less
1961 fragmentation.
1963 To simplify use in double-linked lists, each bin header acts
1964 as a malloc_chunk. This avoids special-casing for headers.
1965 But to conserve space and improve locality, we allocate
1966 only the fd/bk pointers of bins, and then use repositioning tricks
1967 to treat these as the fields of a malloc_chunk*.
1970 typedef struct malloc_chunk* mbinptr;
1972 /* addressing -- note that bin_at(0) does not exist */
1973 #define bin_at(m, i) ((mbinptr)((char*)&((m)->bins[(i)<<1]) - (SIZE_SZ<<1)))
1975 /* analog of ++bin */
1976 #define next_bin(b) ((mbinptr)((char*)(b) + (sizeof(mchunkptr)<<1)))
1978 /* Reminders about list directionality within bins */
1979 #define first(b) ((b)->fd)
1980 #define last(b) ((b)->bk)
1982 /* Take a chunk off a bin list */
1983 #define unlink(P, BK, FD) { \
1984 FD = P->fd; \
1985 BK = P->bk; \
1986 if (__builtin_expect (FD->bk != P || BK->fd != P, 0)) \
1987 malloc_printerr (check_action, "corrupted double-linked list", P); \
1988 else { \
1989 FD->bk = BK; \
1990 BK->fd = FD; \
1995 Indexing
1997 Bins for sizes < 512 bytes contain chunks of all the same size, spaced
1998 8 bytes apart. Larger bins are approximately logarithmically spaced:
2000 64 bins of size 8
2001 32 bins of size 64
2002 16 bins of size 512
2003 8 bins of size 4096
2004 4 bins of size 32768
2005 2 bins of size 262144
2006 1 bin of size what's left
2008 There is actually a little bit of slop in the numbers in bin_index
2009 for the sake of speed. This makes no difference elsewhere.
2011 The bins top out around 1MB because we expect to service large
2012 requests via mmap.
2015 #define NBINS 128
2016 #define NSMALLBINS 64
2017 #define SMALLBIN_WIDTH 8
2018 #define MIN_LARGE_SIZE 512
2020 #define in_smallbin_range(sz) \
2021 ((unsigned long)(sz) < (unsigned long)MIN_LARGE_SIZE)
2023 #define smallbin_index(sz) (((unsigned)(sz)) >> 3)
2025 #define largebin_index(sz) \
2026 (((((unsigned long)(sz)) >> 6) <= 32)? 56 + (((unsigned long)(sz)) >> 6): \
2027 ((((unsigned long)(sz)) >> 9) <= 20)? 91 + (((unsigned long)(sz)) >> 9): \
2028 ((((unsigned long)(sz)) >> 12) <= 10)? 110 + (((unsigned long)(sz)) >> 12): \
2029 ((((unsigned long)(sz)) >> 15) <= 4)? 119 + (((unsigned long)(sz)) >> 15): \
2030 ((((unsigned long)(sz)) >> 18) <= 2)? 124 + (((unsigned long)(sz)) >> 18): \
2031 126)
2033 #define bin_index(sz) \
2034 ((in_smallbin_range(sz)) ? smallbin_index(sz) : largebin_index(sz))
2038 Unsorted chunks
2040 All remainders from chunk splits, as well as all returned chunks,
2041 are first placed in the "unsorted" bin. They are then placed
2042 in regular bins after malloc gives them ONE chance to be used before
2043 binning. So, basically, the unsorted_chunks list acts as a queue,
2044 with chunks being placed on it in free (and malloc_consolidate),
2045 and taken off (to be either used or placed in bins) in malloc.
2047 The NON_MAIN_ARENA flag is never set for unsorted chunks, so it
2048 does not have to be taken into account in size comparisons.
2051 /* The otherwise unindexable 1-bin is used to hold unsorted chunks. */
2052 #define unsorted_chunks(M) (bin_at(M, 1))
2057 The top-most available chunk (i.e., the one bordering the end of
2058 available memory) is treated specially. It is never included in
2059 any bin, is used only if no other chunk is available, and is
2060 released back to the system if it is very large (see
2061 M_TRIM_THRESHOLD). Because top initially
2062 points to its own bin with initial zero size, thus forcing
2063 extension on the first malloc request, we avoid having any special
2064 code in malloc to check whether it even exists yet. But we still
2065 need to do so when getting memory from system, so we make
2066 initial_top treat the bin as a legal but unusable chunk during the
2067 interval between initialization and the first call to
2068 sYSMALLOc. (This is somewhat delicate, since it relies on
2069 the 2 preceding words to be zero during this interval as well.)
2072 /* Conveniently, the unsorted bin can be used as dummy top on first call */
2073 #define initial_top(M) (unsorted_chunks(M))
2076 Binmap
2078 To help compensate for the large number of bins, a one-level index
2079 structure is used for bin-by-bin searching. `binmap' is a
2080 bitvector recording whether bins are definitely empty so they can
2081 be skipped over during during traversals. The bits are NOT always
2082 cleared as soon as bins are empty, but instead only
2083 when they are noticed to be empty during traversal in malloc.
2086 /* Conservatively use 32 bits per map word, even if on 64bit system */
2087 #define BINMAPSHIFT 5
2088 #define BITSPERMAP (1U << BINMAPSHIFT)
2089 #define BINMAPSIZE (NBINS / BITSPERMAP)
2091 #define idx2block(i) ((i) >> BINMAPSHIFT)
2092 #define idx2bit(i) ((1U << ((i) & ((1U << BINMAPSHIFT)-1))))
2094 #define mark_bin(m,i) ((m)->binmap[idx2block(i)] |= idx2bit(i))
2095 #define unmark_bin(m,i) ((m)->binmap[idx2block(i)] &= ~(idx2bit(i)))
2096 #define get_binmap(m,i) ((m)->binmap[idx2block(i)] & idx2bit(i))
2099 Fastbins
2101 An array of lists holding recently freed small chunks. Fastbins
2102 are not doubly linked. It is faster to single-link them, and
2103 since chunks are never removed from the middles of these lists,
2104 double linking is not necessary. Also, unlike regular bins, they
2105 are not even processed in FIFO order (they use faster LIFO) since
2106 ordering doesn't much matter in the transient contexts in which
2107 fastbins are normally used.
2109 Chunks in fastbins keep their inuse bit set, so they cannot
2110 be consolidated with other free chunks. malloc_consolidate
2111 releases all chunks in fastbins and consolidates them with
2112 other free chunks.
2115 typedef struct malloc_chunk* mfastbinptr;
2117 /* offset 2 to use otherwise unindexable first 2 bins */
2118 #define fastbin_index(sz) ((((unsigned int)(sz)) >> 3) - 2)
2120 /* The maximum fastbin request size we support */
2121 #define MAX_FAST_SIZE 80
2123 #define NFASTBINS (fastbin_index(request2size(MAX_FAST_SIZE))+1)
2126 FASTBIN_CONSOLIDATION_THRESHOLD is the size of a chunk in free()
2127 that triggers automatic consolidation of possibly-surrounding
2128 fastbin chunks. This is a heuristic, so the exact value should not
2129 matter too much. It is defined at half the default trim threshold as a
2130 compromise heuristic to only attempt consolidation if it is likely
2131 to lead to trimming. However, it is not dynamically tunable, since
2132 consolidation reduces fragmentation surrounding large chunks even
2133 if trimming is not used.
2136 #define FASTBIN_CONSOLIDATION_THRESHOLD (65536UL)
2139 Since the lowest 2 bits in max_fast don't matter in size comparisons,
2140 they are used as flags.
2144 FASTCHUNKS_BIT held in max_fast indicates that there are probably
2145 some fastbin chunks. It is set true on entering a chunk into any
2146 fastbin, and cleared only in malloc_consolidate.
2148 The truth value is inverted so that have_fastchunks will be true
2149 upon startup (since statics are zero-filled), simplifying
2150 initialization checks.
2153 #define FASTCHUNKS_BIT (1U)
2155 #define have_fastchunks(M) (((M)->max_fast & FASTCHUNKS_BIT) == 0)
2156 #define clear_fastchunks(M) ((M)->max_fast |= FASTCHUNKS_BIT)
2157 #define set_fastchunks(M) ((M)->max_fast &= ~FASTCHUNKS_BIT)
2160 NONCONTIGUOUS_BIT indicates that MORECORE does not return contiguous
2161 regions. Otherwise, contiguity is exploited in merging together,
2162 when possible, results from consecutive MORECORE calls.
2164 The initial value comes from MORECORE_CONTIGUOUS, but is
2165 changed dynamically if mmap is ever used as an sbrk substitute.
2168 #define NONCONTIGUOUS_BIT (2U)
2170 #define contiguous(M) (((M)->max_fast & NONCONTIGUOUS_BIT) == 0)
2171 #define noncontiguous(M) (((M)->max_fast & NONCONTIGUOUS_BIT) != 0)
2172 #define set_noncontiguous(M) ((M)->max_fast |= NONCONTIGUOUS_BIT)
2173 #define set_contiguous(M) ((M)->max_fast &= ~NONCONTIGUOUS_BIT)
2176 Set value of max_fast.
2177 Use impossibly small value if 0.
2178 Precondition: there are no existing fastbin chunks.
2179 Setting the value clears fastchunk bit but preserves noncontiguous bit.
2182 #define set_max_fast(M, s) \
2183 (M)->max_fast = (((s) == 0)? SMALLBIN_WIDTH: request2size(s)) | \
2184 FASTCHUNKS_BIT | \
2185 ((M)->max_fast & NONCONTIGUOUS_BIT)
2189 ----------- Internal state representation and initialization -----------
2192 struct malloc_state {
2193 /* Serialize access. */
2194 mutex_t mutex;
2195 // Should we have padding to move the mutex to its own cache line?
2197 #if THREAD_STATS
2198 /* Statistics for locking. Only used if THREAD_STATS is defined. */
2199 long stat_lock_direct, stat_lock_loop, stat_lock_wait;
2200 #endif
2202 /* The maximum chunk size to be eligible for fastbin */
2203 INTERNAL_SIZE_T max_fast; /* low 2 bits used as flags */
2205 /* Fastbins */
2206 mfastbinptr fastbins[NFASTBINS];
2208 /* Base of the topmost chunk -- not otherwise kept in a bin */
2209 mchunkptr top;
2211 /* The remainder from the most recent split of a small request */
2212 mchunkptr last_remainder;
2214 /* Normal bins packed as described above */
2215 mchunkptr bins[NBINS * 2];
2217 /* Bitmap of bins */
2218 unsigned int binmap[BINMAPSIZE];
2220 /* Linked list */
2221 struct malloc_state *next;
2223 /* Memory allocated from the system in this arena. */
2224 INTERNAL_SIZE_T system_mem;
2225 INTERNAL_SIZE_T max_system_mem;
2228 struct malloc_par {
2229 /* Tunable parameters */
2230 unsigned long trim_threshold;
2231 INTERNAL_SIZE_T top_pad;
2232 INTERNAL_SIZE_T mmap_threshold;
2234 /* Memory map support */
2235 int n_mmaps;
2236 int n_mmaps_max;
2237 int max_n_mmaps;
2239 /* Cache malloc_getpagesize */
2240 unsigned int pagesize;
2242 /* Statistics */
2243 INTERNAL_SIZE_T mmapped_mem;
2244 /*INTERNAL_SIZE_T sbrked_mem;*/
2245 /*INTERNAL_SIZE_T max_sbrked_mem;*/
2246 INTERNAL_SIZE_T max_mmapped_mem;
2247 INTERNAL_SIZE_T max_total_mem; /* only kept for NO_THREADS */
2249 /* First address handed out by MORECORE/sbrk. */
2250 char* sbrk_base;
2253 /* There are several instances of this struct ("arenas") in this
2254 malloc. If you are adapting this malloc in a way that does NOT use
2255 a static or mmapped malloc_state, you MUST explicitly zero-fill it
2256 before using. This malloc relies on the property that malloc_state
2257 is initialized to all zeroes (as is true of C statics). */
2259 static struct malloc_state main_arena;
2261 /* There is only one instance of the malloc parameters. */
2263 static struct malloc_par mp_;
2266 Initialize a malloc_state struct.
2268 This is called only from within malloc_consolidate, which needs
2269 be called in the same contexts anyway. It is never called directly
2270 outside of malloc_consolidate because some optimizing compilers try
2271 to inline it at all call points, which turns out not to be an
2272 optimization at all. (Inlining it in malloc_consolidate is fine though.)
2275 #if __STD_C
2276 static void malloc_init_state(mstate av)
2277 #else
2278 static void malloc_init_state(av) mstate av;
2279 #endif
2281 int i;
2282 mbinptr bin;
2284 /* Establish circular links for normal bins */
2285 for (i = 1; i < NBINS; ++i) {
2286 bin = bin_at(av,i);
2287 bin->fd = bin->bk = bin;
2290 #if MORECORE_CONTIGUOUS
2291 if (av != &main_arena)
2292 #endif
2293 set_noncontiguous(av);
2295 set_max_fast(av, DEFAULT_MXFAST);
2297 av->top = initial_top(av);
2301 Other internal utilities operating on mstates
2304 #if __STD_C
2305 static Void_t* sYSMALLOc(INTERNAL_SIZE_T, mstate);
2306 static int sYSTRIm(size_t, mstate);
2307 static void malloc_consolidate(mstate);
2308 static Void_t** iALLOc(mstate, size_t, size_t*, int, Void_t**);
2309 #else
2310 static Void_t* sYSMALLOc();
2311 static int sYSTRIm();
2312 static void malloc_consolidate();
2313 static Void_t** iALLOc();
2314 #endif
2317 /* -------------- Early definitions for debugging hooks ---------------- */
2319 /* Define and initialize the hook variables. These weak definitions must
2320 appear before any use of the variables in a function (arena.c uses one). */
2321 #ifndef weak_variable
2322 #ifndef _LIBC
2323 #define weak_variable /**/
2324 #else
2325 /* In GNU libc we want the hook variables to be weak definitions to
2326 avoid a problem with Emacs. */
2327 #define weak_variable weak_function
2328 #endif
2329 #endif
2331 /* Forward declarations. */
2332 static Void_t* malloc_hook_ini __MALLOC_P ((size_t sz,
2333 const __malloc_ptr_t caller));
2334 static Void_t* realloc_hook_ini __MALLOC_P ((Void_t* ptr, size_t sz,
2335 const __malloc_ptr_t caller));
2336 static Void_t* memalign_hook_ini __MALLOC_P ((size_t alignment, size_t sz,
2337 const __malloc_ptr_t caller));
2339 void weak_variable (*__malloc_initialize_hook) (void) = NULL;
2340 void weak_variable (*__free_hook) (__malloc_ptr_t __ptr,
2341 const __malloc_ptr_t) = NULL;
2342 __malloc_ptr_t weak_variable (*__malloc_hook)
2343 (size_t __size, const __malloc_ptr_t) = malloc_hook_ini;
2344 __malloc_ptr_t weak_variable (*__realloc_hook)
2345 (__malloc_ptr_t __ptr, size_t __size, const __malloc_ptr_t)
2346 = realloc_hook_ini;
2347 __malloc_ptr_t weak_variable (*__memalign_hook)
2348 (size_t __alignment, size_t __size, const __malloc_ptr_t)
2349 = memalign_hook_ini;
2350 void weak_variable (*__after_morecore_hook) (void) = NULL;
2353 /* ---------------- Error behavior ------------------------------------ */
2355 #ifndef DEFAULT_CHECK_ACTION
2356 #define DEFAULT_CHECK_ACTION 3
2357 #endif
2359 static int check_action = DEFAULT_CHECK_ACTION;
2362 /* ------------------- Support for multiple arenas -------------------- */
2363 #include "arena.c"
2366 Debugging support
2368 These routines make a number of assertions about the states
2369 of data structures that should be true at all times. If any
2370 are not true, it's very likely that a user program has somehow
2371 trashed memory. (It's also possible that there is a coding error
2372 in malloc. In which case, please report it!)
2375 #if ! MALLOC_DEBUG
2377 #define check_chunk(A,P)
2378 #define check_free_chunk(A,P)
2379 #define check_inuse_chunk(A,P)
2380 #define check_remalloced_chunk(A,P,N)
2381 #define check_malloced_chunk(A,P,N)
2382 #define check_malloc_state(A)
2384 #else
2386 #define check_chunk(A,P) do_check_chunk(A,P)
2387 #define check_free_chunk(A,P) do_check_free_chunk(A,P)
2388 #define check_inuse_chunk(A,P) do_check_inuse_chunk(A,P)
2389 #define check_remalloced_chunk(A,P,N) do_check_remalloced_chunk(A,P,N)
2390 #define check_malloced_chunk(A,P,N) do_check_malloced_chunk(A,P,N)
2391 #define check_malloc_state(A) do_check_malloc_state(A)
2394 Properties of all chunks
2397 #if __STD_C
2398 static void do_check_chunk(mstate av, mchunkptr p)
2399 #else
2400 static void do_check_chunk(av, p) mstate av; mchunkptr p;
2401 #endif
2403 unsigned long sz = chunksize(p);
2404 /* min and max possible addresses assuming contiguous allocation */
2405 char* max_address = (char*)(av->top) + chunksize(av->top);
2406 char* min_address = max_address - av->system_mem;
2408 if (!chunk_is_mmapped(p)) {
2410 /* Has legal address ... */
2411 if (p != av->top) {
2412 if (contiguous(av)) {
2413 assert(((char*)p) >= min_address);
2414 assert(((char*)p + sz) <= ((char*)(av->top)));
2417 else {
2418 /* top size is always at least MINSIZE */
2419 assert((unsigned long)(sz) >= MINSIZE);
2420 /* top predecessor always marked inuse */
2421 assert(prev_inuse(p));
2425 else {
2426 #if HAVE_MMAP
2427 /* address is outside main heap */
2428 if (contiguous(av) && av->top != initial_top(av)) {
2429 assert(((char*)p) < min_address || ((char*)p) > max_address);
2431 /* chunk is page-aligned */
2432 assert(((p->prev_size + sz) & (mp_.pagesize-1)) == 0);
2433 /* mem is aligned */
2434 assert(aligned_OK(chunk2mem(p)));
2435 #else
2436 /* force an appropriate assert violation if debug set */
2437 assert(!chunk_is_mmapped(p));
2438 #endif
2443 Properties of free chunks
2446 #if __STD_C
2447 static void do_check_free_chunk(mstate av, mchunkptr p)
2448 #else
2449 static void do_check_free_chunk(av, p) mstate av; mchunkptr p;
2450 #endif
2452 INTERNAL_SIZE_T sz = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
2453 mchunkptr next = chunk_at_offset(p, sz);
2455 do_check_chunk(av, p);
2457 /* Chunk must claim to be free ... */
2458 assert(!inuse(p));
2459 assert (!chunk_is_mmapped(p));
2461 /* Unless a special marker, must have OK fields */
2462 if ((unsigned long)(sz) >= MINSIZE)
2464 assert((sz & MALLOC_ALIGN_MASK) == 0);
2465 assert(aligned_OK(chunk2mem(p)));
2466 /* ... matching footer field */
2467 assert(next->prev_size == sz);
2468 /* ... and is fully consolidated */
2469 assert(prev_inuse(p));
2470 assert (next == av->top || inuse(next));
2472 /* ... and has minimally sane links */
2473 assert(p->fd->bk == p);
2474 assert(p->bk->fd == p);
2476 else /* markers are always of size SIZE_SZ */
2477 assert(sz == SIZE_SZ);
2481 Properties of inuse chunks
2484 #if __STD_C
2485 static void do_check_inuse_chunk(mstate av, mchunkptr p)
2486 #else
2487 static void do_check_inuse_chunk(av, p) mstate av; mchunkptr p;
2488 #endif
2490 mchunkptr next;
2492 do_check_chunk(av, p);
2494 if (chunk_is_mmapped(p))
2495 return; /* mmapped chunks have no next/prev */
2497 /* Check whether it claims to be in use ... */
2498 assert(inuse(p));
2500 next = next_chunk(p);
2502 /* ... and is surrounded by OK chunks.
2503 Since more things can be checked with free chunks than inuse ones,
2504 if an inuse chunk borders them and debug is on, it's worth doing them.
2506 if (!prev_inuse(p)) {
2507 /* Note that we cannot even look at prev unless it is not inuse */
2508 mchunkptr prv = prev_chunk(p);
2509 assert(next_chunk(prv) == p);
2510 do_check_free_chunk(av, prv);
2513 if (next == av->top) {
2514 assert(prev_inuse(next));
2515 assert(chunksize(next) >= MINSIZE);
2517 else if (!inuse(next))
2518 do_check_free_chunk(av, next);
2522 Properties of chunks recycled from fastbins
2525 #if __STD_C
2526 static void do_check_remalloced_chunk(mstate av, mchunkptr p, INTERNAL_SIZE_T s)
2527 #else
2528 static void do_check_remalloced_chunk(av, p, s)
2529 mstate av; mchunkptr p; INTERNAL_SIZE_T s;
2530 #endif
2532 INTERNAL_SIZE_T sz = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
2534 if (!chunk_is_mmapped(p)) {
2535 assert(av == arena_for_chunk(p));
2536 if (chunk_non_main_arena(p))
2537 assert(av != &main_arena);
2538 else
2539 assert(av == &main_arena);
2542 do_check_inuse_chunk(av, p);
2544 /* Legal size ... */
2545 assert((sz & MALLOC_ALIGN_MASK) == 0);
2546 assert((unsigned long)(sz) >= MINSIZE);
2547 /* ... and alignment */
2548 assert(aligned_OK(chunk2mem(p)));
2549 /* chunk is less than MINSIZE more than request */
2550 assert((long)(sz) - (long)(s) >= 0);
2551 assert((long)(sz) - (long)(s + MINSIZE) < 0);
2555 Properties of nonrecycled chunks at the point they are malloced
2558 #if __STD_C
2559 static void do_check_malloced_chunk(mstate av, mchunkptr p, INTERNAL_SIZE_T s)
2560 #else
2561 static void do_check_malloced_chunk(av, p, s)
2562 mstate av; mchunkptr p; INTERNAL_SIZE_T s;
2563 #endif
2565 /* same as recycled case ... */
2566 do_check_remalloced_chunk(av, p, s);
2569 ... plus, must obey implementation invariant that prev_inuse is
2570 always true of any allocated chunk; i.e., that each allocated
2571 chunk borders either a previously allocated and still in-use
2572 chunk, or the base of its memory arena. This is ensured
2573 by making all allocations from the the `lowest' part of any found
2574 chunk. This does not necessarily hold however for chunks
2575 recycled via fastbins.
2578 assert(prev_inuse(p));
2583 Properties of malloc_state.
2585 This may be useful for debugging malloc, as well as detecting user
2586 programmer errors that somehow write into malloc_state.
2588 If you are extending or experimenting with this malloc, you can
2589 probably figure out how to hack this routine to print out or
2590 display chunk addresses, sizes, bins, and other instrumentation.
2593 static void do_check_malloc_state(mstate av)
2595 int i;
2596 mchunkptr p;
2597 mchunkptr q;
2598 mbinptr b;
2599 unsigned int binbit;
2600 int empty;
2601 unsigned int idx;
2602 INTERNAL_SIZE_T size;
2603 unsigned long total = 0;
2604 int max_fast_bin;
2606 /* internal size_t must be no wider than pointer type */
2607 assert(sizeof(INTERNAL_SIZE_T) <= sizeof(char*));
2609 /* alignment is a power of 2 */
2610 assert((MALLOC_ALIGNMENT & (MALLOC_ALIGNMENT-1)) == 0);
2612 /* cannot run remaining checks until fully initialized */
2613 if (av->top == 0 || av->top == initial_top(av))
2614 return;
2616 /* pagesize is a power of 2 */
2617 assert((mp_.pagesize & (mp_.pagesize-1)) == 0);
2619 /* A contiguous main_arena is consistent with sbrk_base. */
2620 if (av == &main_arena && contiguous(av))
2621 assert((char*)mp_.sbrk_base + av->system_mem ==
2622 (char*)av->top + chunksize(av->top));
2624 /* properties of fastbins */
2626 /* max_fast is in allowed range */
2627 assert((av->max_fast & ~1) <= request2size(MAX_FAST_SIZE));
2629 max_fast_bin = fastbin_index(av->max_fast);
2631 for (i = 0; i < NFASTBINS; ++i) {
2632 p = av->fastbins[i];
2634 /* all bins past max_fast are empty */
2635 if (i > max_fast_bin)
2636 assert(p == 0);
2638 while (p != 0) {
2639 /* each chunk claims to be inuse */
2640 do_check_inuse_chunk(av, p);
2641 total += chunksize(p);
2642 /* chunk belongs in this bin */
2643 assert(fastbin_index(chunksize(p)) == i);
2644 p = p->fd;
2648 if (total != 0)
2649 assert(have_fastchunks(av));
2650 else if (!have_fastchunks(av))
2651 assert(total == 0);
2653 /* check normal bins */
2654 for (i = 1; i < NBINS; ++i) {
2655 b = bin_at(av,i);
2657 /* binmap is accurate (except for bin 1 == unsorted_chunks) */
2658 if (i >= 2) {
2659 binbit = get_binmap(av,i);
2660 empty = last(b) == b;
2661 if (!binbit)
2662 assert(empty);
2663 else if (!empty)
2664 assert(binbit);
2667 for (p = last(b); p != b; p = p->bk) {
2668 /* each chunk claims to be free */
2669 do_check_free_chunk(av, p);
2670 size = chunksize(p);
2671 total += size;
2672 if (i >= 2) {
2673 /* chunk belongs in bin */
2674 idx = bin_index(size);
2675 assert(idx == i);
2676 /* lists are sorted */
2677 assert(p->bk == b ||
2678 (unsigned long)chunksize(p->bk) >= (unsigned long)chunksize(p));
2680 /* chunk is followed by a legal chain of inuse chunks */
2681 for (q = next_chunk(p);
2682 (q != av->top && inuse(q) &&
2683 (unsigned long)(chunksize(q)) >= MINSIZE);
2684 q = next_chunk(q))
2685 do_check_inuse_chunk(av, q);
2689 /* top chunk is OK */
2690 check_chunk(av, av->top);
2692 /* sanity checks for statistics */
2694 #ifdef NO_THREADS
2695 assert(total <= (unsigned long)(mp_.max_total_mem));
2696 assert(mp_.n_mmaps >= 0);
2697 #endif
2698 assert(mp_.n_mmaps <= mp_.n_mmaps_max);
2699 assert(mp_.n_mmaps <= mp_.max_n_mmaps);
2701 assert((unsigned long)(av->system_mem) <=
2702 (unsigned long)(av->max_system_mem));
2704 assert((unsigned long)(mp_.mmapped_mem) <=
2705 (unsigned long)(mp_.max_mmapped_mem));
2707 #ifdef NO_THREADS
2708 assert((unsigned long)(mp_.max_total_mem) >=
2709 (unsigned long)(mp_.mmapped_mem) + (unsigned long)(av->system_mem));
2710 #endif
2712 #endif
2715 /* ----------------- Support for debugging hooks -------------------- */
2716 #include "hooks.c"
2719 /* ----------- Routines dealing with system allocation -------------- */
2722 sysmalloc handles malloc cases requiring more memory from the system.
2723 On entry, it is assumed that av->top does not have enough
2724 space to service request for nb bytes, thus requiring that av->top
2725 be extended or replaced.
2728 #if __STD_C
2729 static Void_t* sYSMALLOc(INTERNAL_SIZE_T nb, mstate av)
2730 #else
2731 static Void_t* sYSMALLOc(nb, av) INTERNAL_SIZE_T nb; mstate av;
2732 #endif
2734 mchunkptr old_top; /* incoming value of av->top */
2735 INTERNAL_SIZE_T old_size; /* its size */
2736 char* old_end; /* its end address */
2738 long size; /* arg to first MORECORE or mmap call */
2739 char* brk; /* return value from MORECORE */
2741 long correction; /* arg to 2nd MORECORE call */
2742 char* snd_brk; /* 2nd return val */
2744 INTERNAL_SIZE_T front_misalign; /* unusable bytes at front of new space */
2745 INTERNAL_SIZE_T end_misalign; /* partial page left at end of new space */
2746 char* aligned_brk; /* aligned offset into brk */
2748 mchunkptr p; /* the allocated/returned chunk */
2749 mchunkptr remainder; /* remainder from allocation */
2750 unsigned long remainder_size; /* its size */
2752 unsigned long sum; /* for updating stats */
2754 size_t pagemask = mp_.pagesize - 1;
2757 #if HAVE_MMAP
2760 If have mmap, and the request size meets the mmap threshold, and
2761 the system supports mmap, and there are few enough currently
2762 allocated mmapped regions, try to directly map this request
2763 rather than expanding top.
2766 if ((unsigned long)(nb) >= (unsigned long)(mp_.mmap_threshold) &&
2767 (mp_.n_mmaps < mp_.n_mmaps_max)) {
2769 char* mm; /* return value from mmap call*/
2772 Round up size to nearest page. For mmapped chunks, the overhead
2773 is one SIZE_SZ unit larger than for normal chunks, because there
2774 is no following chunk whose prev_size field could be used.
2776 size = (nb + SIZE_SZ + MALLOC_ALIGN_MASK + pagemask) & ~pagemask;
2778 /* Don't try if size wraps around 0 */
2779 if ((unsigned long)(size) > (unsigned long)(nb)) {
2781 mm = (char*)(MMAP(0, size, PROT_READ|PROT_WRITE, MAP_PRIVATE));
2783 if (mm != MAP_FAILED) {
2786 The offset to the start of the mmapped region is stored
2787 in the prev_size field of the chunk. This allows us to adjust
2788 returned start address to meet alignment requirements here
2789 and in memalign(), and still be able to compute proper
2790 address argument for later munmap in free() and realloc().
2793 front_misalign = (INTERNAL_SIZE_T)chunk2mem(mm) & MALLOC_ALIGN_MASK;
2794 if (front_misalign > 0) {
2795 correction = MALLOC_ALIGNMENT - front_misalign;
2796 p = (mchunkptr)(mm + correction);
2797 p->prev_size = correction;
2798 set_head(p, (size - correction) |IS_MMAPPED);
2800 else {
2801 p = (mchunkptr)mm;
2802 set_head(p, size|IS_MMAPPED);
2805 /* update statistics */
2807 if (++mp_.n_mmaps > mp_.max_n_mmaps)
2808 mp_.max_n_mmaps = mp_.n_mmaps;
2810 sum = mp_.mmapped_mem += size;
2811 if (sum > (unsigned long)(mp_.max_mmapped_mem))
2812 mp_.max_mmapped_mem = sum;
2813 #ifdef NO_THREADS
2814 sum += av->system_mem;
2815 if (sum > (unsigned long)(mp_.max_total_mem))
2816 mp_.max_total_mem = sum;
2817 #endif
2819 check_chunk(av, p);
2821 return chunk2mem(p);
2825 #endif
2827 /* Record incoming configuration of top */
2829 old_top = av->top;
2830 old_size = chunksize(old_top);
2831 old_end = (char*)(chunk_at_offset(old_top, old_size));
2833 brk = snd_brk = (char*)(MORECORE_FAILURE);
2836 If not the first time through, we require old_size to be
2837 at least MINSIZE and to have prev_inuse set.
2840 assert((old_top == initial_top(av) && old_size == 0) ||
2841 ((unsigned long) (old_size) >= MINSIZE &&
2842 prev_inuse(old_top) &&
2843 ((unsigned long)old_end & pagemask) == 0));
2845 /* Precondition: not enough current space to satisfy nb request */
2846 assert((unsigned long)(old_size) < (unsigned long)(nb + MINSIZE));
2848 /* Precondition: all fastbins are consolidated */
2849 assert(!have_fastchunks(av));
2852 if (av != &main_arena) {
2854 heap_info *old_heap, *heap;
2855 size_t old_heap_size;
2857 /* First try to extend the current heap. */
2858 old_heap = heap_for_ptr(old_top);
2859 old_heap_size = old_heap->size;
2860 if (grow_heap(old_heap, MINSIZE + nb - old_size) == 0) {
2861 av->system_mem += old_heap->size - old_heap_size;
2862 arena_mem += old_heap->size - old_heap_size;
2863 #if 0
2864 if(mmapped_mem + arena_mem + sbrked_mem > max_total_mem)
2865 max_total_mem = mmapped_mem + arena_mem + sbrked_mem;
2866 #endif
2867 set_head(old_top, (((char *)old_heap + old_heap->size) - (char *)old_top)
2868 | PREV_INUSE);
2870 else if ((heap = new_heap(nb + (MINSIZE + sizeof(*heap)), mp_.top_pad))) {
2871 /* Use a newly allocated heap. */
2872 heap->ar_ptr = av;
2873 heap->prev = old_heap;
2874 av->system_mem += heap->size;
2875 arena_mem += heap->size;
2876 #if 0
2877 if((unsigned long)(mmapped_mem + arena_mem + sbrked_mem) > max_total_mem)
2878 max_total_mem = mmapped_mem + arena_mem + sbrked_mem;
2879 #endif
2880 /* Set up the new top. */
2881 top(av) = chunk_at_offset(heap, sizeof(*heap));
2882 set_head(top(av), (heap->size - sizeof(*heap)) | PREV_INUSE);
2884 /* Setup fencepost and free the old top chunk. */
2885 /* The fencepost takes at least MINSIZE bytes, because it might
2886 become the top chunk again later. Note that a footer is set
2887 up, too, although the chunk is marked in use. */
2888 old_size -= MINSIZE;
2889 set_head(chunk_at_offset(old_top, old_size + 2*SIZE_SZ), 0|PREV_INUSE);
2890 if (old_size >= MINSIZE) {
2891 set_head(chunk_at_offset(old_top, old_size), (2*SIZE_SZ)|PREV_INUSE);
2892 set_foot(chunk_at_offset(old_top, old_size), (2*SIZE_SZ));
2893 set_head(old_top, old_size|PREV_INUSE|NON_MAIN_ARENA);
2894 _int_free(av, chunk2mem(old_top));
2895 } else {
2896 set_head(old_top, (old_size + 2*SIZE_SZ)|PREV_INUSE);
2897 set_foot(old_top, (old_size + 2*SIZE_SZ));
2901 } else { /* av == main_arena */
2904 /* Request enough space for nb + pad + overhead */
2906 size = nb + mp_.top_pad + MINSIZE;
2909 If contiguous, we can subtract out existing space that we hope to
2910 combine with new space. We add it back later only if
2911 we don't actually get contiguous space.
2914 if (contiguous(av))
2915 size -= old_size;
2918 Round to a multiple of page size.
2919 If MORECORE is not contiguous, this ensures that we only call it
2920 with whole-page arguments. And if MORECORE is contiguous and
2921 this is not first time through, this preserves page-alignment of
2922 previous calls. Otherwise, we correct to page-align below.
2925 size = (size + pagemask) & ~pagemask;
2928 Don't try to call MORECORE if argument is so big as to appear
2929 negative. Note that since mmap takes size_t arg, it may succeed
2930 below even if we cannot call MORECORE.
2933 if (size > 0)
2934 brk = (char*)(MORECORE(size));
2936 if (brk != (char*)(MORECORE_FAILURE)) {
2937 /* Call the `morecore' hook if necessary. */
2938 if (__after_morecore_hook)
2939 (*__after_morecore_hook) ();
2940 } else {
2942 If have mmap, try using it as a backup when MORECORE fails or
2943 cannot be used. This is worth doing on systems that have "holes" in
2944 address space, so sbrk cannot extend to give contiguous space, but
2945 space is available elsewhere. Note that we ignore mmap max count
2946 and threshold limits, since the space will not be used as a
2947 segregated mmap region.
2950 #if HAVE_MMAP
2951 /* Cannot merge with old top, so add its size back in */
2952 if (contiguous(av))
2953 size = (size + old_size + pagemask) & ~pagemask;
2955 /* If we are relying on mmap as backup, then use larger units */
2956 if ((unsigned long)(size) < (unsigned long)(MMAP_AS_MORECORE_SIZE))
2957 size = MMAP_AS_MORECORE_SIZE;
2959 /* Don't try if size wraps around 0 */
2960 if ((unsigned long)(size) > (unsigned long)(nb)) {
2962 char *mbrk = (char*)(MMAP(0, size, PROT_READ|PROT_WRITE, MAP_PRIVATE));
2964 if (mbrk != MAP_FAILED) {
2966 /* We do not need, and cannot use, another sbrk call to find end */
2967 brk = mbrk;
2968 snd_brk = brk + size;
2971 Record that we no longer have a contiguous sbrk region.
2972 After the first time mmap is used as backup, we do not
2973 ever rely on contiguous space since this could incorrectly
2974 bridge regions.
2976 set_noncontiguous(av);
2979 #endif
2982 if (brk != (char*)(MORECORE_FAILURE)) {
2983 if (mp_.sbrk_base == 0)
2984 mp_.sbrk_base = brk;
2985 av->system_mem += size;
2988 If MORECORE extends previous space, we can likewise extend top size.
2991 if (brk == old_end && snd_brk == (char*)(MORECORE_FAILURE))
2992 set_head(old_top, (size + old_size) | PREV_INUSE);
2994 else if (contiguous(av) && old_size && brk < old_end) {
2995 /* Oops! Someone else killed our space.. Can't touch anything. */
2996 assert(0);
3000 Otherwise, make adjustments:
3002 * If the first time through or noncontiguous, we need to call sbrk
3003 just to find out where the end of memory lies.
3005 * We need to ensure that all returned chunks from malloc will meet
3006 MALLOC_ALIGNMENT
3008 * If there was an intervening foreign sbrk, we need to adjust sbrk
3009 request size to account for fact that we will not be able to
3010 combine new space with existing space in old_top.
3012 * Almost all systems internally allocate whole pages at a time, in
3013 which case we might as well use the whole last page of request.
3014 So we allocate enough more memory to hit a page boundary now,
3015 which in turn causes future contiguous calls to page-align.
3018 else {
3019 front_misalign = 0;
3020 end_misalign = 0;
3021 correction = 0;
3022 aligned_brk = brk;
3024 /* handle contiguous cases */
3025 if (contiguous(av)) {
3027 /* Count foreign sbrk as system_mem. */
3028 if (old_size)
3029 av->system_mem += brk - old_end;
3031 /* Guarantee alignment of first new chunk made from this space */
3033 front_misalign = (INTERNAL_SIZE_T)chunk2mem(brk) & MALLOC_ALIGN_MASK;
3034 if (front_misalign > 0) {
3037 Skip over some bytes to arrive at an aligned position.
3038 We don't need to specially mark these wasted front bytes.
3039 They will never be accessed anyway because
3040 prev_inuse of av->top (and any chunk created from its start)
3041 is always true after initialization.
3044 correction = MALLOC_ALIGNMENT - front_misalign;
3045 aligned_brk += correction;
3049 If this isn't adjacent to existing space, then we will not
3050 be able to merge with old_top space, so must add to 2nd request.
3053 correction += old_size;
3055 /* Extend the end address to hit a page boundary */
3056 end_misalign = (INTERNAL_SIZE_T)(brk + size + correction);
3057 correction += ((end_misalign + pagemask) & ~pagemask) - end_misalign;
3059 assert(correction >= 0);
3060 snd_brk = (char*)(MORECORE(correction));
3063 If can't allocate correction, try to at least find out current
3064 brk. It might be enough to proceed without failing.
3066 Note that if second sbrk did NOT fail, we assume that space
3067 is contiguous with first sbrk. This is a safe assumption unless
3068 program is multithreaded but doesn't use locks and a foreign sbrk
3069 occurred between our first and second calls.
3072 if (snd_brk == (char*)(MORECORE_FAILURE)) {
3073 correction = 0;
3074 snd_brk = (char*)(MORECORE(0));
3075 } else
3076 /* Call the `morecore' hook if necessary. */
3077 if (__after_morecore_hook)
3078 (*__after_morecore_hook) ();
3081 /* handle non-contiguous cases */
3082 else {
3083 /* MORECORE/mmap must correctly align */
3084 assert(((unsigned long)chunk2mem(brk) & MALLOC_ALIGN_MASK) == 0);
3086 /* Find out current end of memory */
3087 if (snd_brk == (char*)(MORECORE_FAILURE)) {
3088 snd_brk = (char*)(MORECORE(0));
3092 /* Adjust top based on results of second sbrk */
3093 if (snd_brk != (char*)(MORECORE_FAILURE)) {
3094 av->top = (mchunkptr)aligned_brk;
3095 set_head(av->top, (snd_brk - aligned_brk + correction) | PREV_INUSE);
3096 av->system_mem += correction;
3099 If not the first time through, we either have a
3100 gap due to foreign sbrk or a non-contiguous region. Insert a
3101 double fencepost at old_top to prevent consolidation with space
3102 we don't own. These fenceposts are artificial chunks that are
3103 marked as inuse and are in any case too small to use. We need
3104 two to make sizes and alignments work out.
3107 if (old_size != 0) {
3109 Shrink old_top to insert fenceposts, keeping size a
3110 multiple of MALLOC_ALIGNMENT. We know there is at least
3111 enough space in old_top to do this.
3113 old_size = (old_size - 4*SIZE_SZ) & ~MALLOC_ALIGN_MASK;
3114 set_head(old_top, old_size | PREV_INUSE);
3117 Note that the following assignments completely overwrite
3118 old_top when old_size was previously MINSIZE. This is
3119 intentional. We need the fencepost, even if old_top otherwise gets
3120 lost.
3122 chunk_at_offset(old_top, old_size )->size =
3123 (2*SIZE_SZ)|PREV_INUSE;
3125 chunk_at_offset(old_top, old_size + 2*SIZE_SZ)->size =
3126 (2*SIZE_SZ)|PREV_INUSE;
3128 /* If possible, release the rest. */
3129 if (old_size >= MINSIZE) {
3130 _int_free(av, chunk2mem(old_top));
3137 /* Update statistics */
3138 #ifdef NO_THREADS
3139 sum = av->system_mem + mp_.mmapped_mem;
3140 if (sum > (unsigned long)(mp_.max_total_mem))
3141 mp_.max_total_mem = sum;
3142 #endif
3146 } /* if (av != &main_arena) */
3148 if ((unsigned long)av->system_mem > (unsigned long)(av->max_system_mem))
3149 av->max_system_mem = av->system_mem;
3150 check_malloc_state(av);
3152 /* finally, do the allocation */
3153 p = av->top;
3154 size = chunksize(p);
3156 /* check that one of the above allocation paths succeeded */
3157 if ((unsigned long)(size) >= (unsigned long)(nb + MINSIZE)) {
3158 remainder_size = size - nb;
3159 remainder = chunk_at_offset(p, nb);
3160 av->top = remainder;
3161 set_head(p, nb | PREV_INUSE | (av != &main_arena ? NON_MAIN_ARENA : 0));
3162 set_head(remainder, remainder_size | PREV_INUSE);
3163 check_malloced_chunk(av, p, nb);
3164 return chunk2mem(p);
3167 /* catch all failure paths */
3168 MALLOC_FAILURE_ACTION;
3169 return 0;
3174 sYSTRIm is an inverse of sorts to sYSMALLOc. It gives memory back
3175 to the system (via negative arguments to sbrk) if there is unused
3176 memory at the `high' end of the malloc pool. It is called
3177 automatically by free() when top space exceeds the trim
3178 threshold. It is also called by the public malloc_trim routine. It
3179 returns 1 if it actually released any memory, else 0.
3182 #if __STD_C
3183 static int sYSTRIm(size_t pad, mstate av)
3184 #else
3185 static int sYSTRIm(pad, av) size_t pad; mstate av;
3186 #endif
3188 long top_size; /* Amount of top-most memory */
3189 long extra; /* Amount to release */
3190 long released; /* Amount actually released */
3191 char* current_brk; /* address returned by pre-check sbrk call */
3192 char* new_brk; /* address returned by post-check sbrk call */
3193 size_t pagesz;
3195 pagesz = mp_.pagesize;
3196 top_size = chunksize(av->top);
3198 /* Release in pagesize units, keeping at least one page */
3199 extra = ((top_size - pad - MINSIZE + (pagesz-1)) / pagesz - 1) * pagesz;
3201 if (extra > 0) {
3204 Only proceed if end of memory is where we last set it.
3205 This avoids problems if there were foreign sbrk calls.
3207 current_brk = (char*)(MORECORE(0));
3208 if (current_brk == (char*)(av->top) + top_size) {
3211 Attempt to release memory. We ignore MORECORE return value,
3212 and instead call again to find out where new end of memory is.
3213 This avoids problems if first call releases less than we asked,
3214 of if failure somehow altered brk value. (We could still
3215 encounter problems if it altered brk in some very bad way,
3216 but the only thing we can do is adjust anyway, which will cause
3217 some downstream failure.)
3220 MORECORE(-extra);
3221 /* Call the `morecore' hook if necessary. */
3222 if (__after_morecore_hook)
3223 (*__after_morecore_hook) ();
3224 new_brk = (char*)(MORECORE(0));
3226 if (new_brk != (char*)MORECORE_FAILURE) {
3227 released = (long)(current_brk - new_brk);
3229 if (released != 0) {
3230 /* Success. Adjust top. */
3231 av->system_mem -= released;
3232 set_head(av->top, (top_size - released) | PREV_INUSE);
3233 check_malloc_state(av);
3234 return 1;
3239 return 0;
3242 #ifdef HAVE_MMAP
3244 static void
3245 internal_function
3246 #if __STD_C
3247 munmap_chunk(mchunkptr p)
3248 #else
3249 munmap_chunk(p) mchunkptr p;
3250 #endif
3252 INTERNAL_SIZE_T size = chunksize(p);
3253 int ret;
3255 assert (chunk_is_mmapped(p));
3256 #if 0
3257 assert(! ((char*)p >= mp_.sbrk_base && (char*)p < mp_.sbrk_base + mp_.sbrked_mem));
3258 assert((mp_.n_mmaps > 0));
3259 #endif
3260 assert(((p->prev_size + size) & (mp_.pagesize-1)) == 0);
3262 mp_.n_mmaps--;
3263 mp_.mmapped_mem -= (size + p->prev_size);
3265 ret = munmap((char *)p - p->prev_size, size + p->prev_size);
3267 /* munmap returns non-zero on failure */
3268 assert(ret == 0);
3271 #if HAVE_MREMAP
3273 static mchunkptr
3274 internal_function
3275 #if __STD_C
3276 mremap_chunk(mchunkptr p, size_t new_size)
3277 #else
3278 mremap_chunk(p, new_size) mchunkptr p; size_t new_size;
3279 #endif
3281 size_t page_mask = mp_.pagesize - 1;
3282 INTERNAL_SIZE_T offset = p->prev_size;
3283 INTERNAL_SIZE_T size = chunksize(p);
3284 char *cp;
3286 assert (chunk_is_mmapped(p));
3287 #if 0
3288 assert(! ((char*)p >= mp_.sbrk_base && (char*)p < mp_.sbrk_base + mp_.sbrked_mem));
3289 assert((mp_.n_mmaps > 0));
3290 #endif
3291 assert(((size + offset) & (mp_.pagesize-1)) == 0);
3293 /* Note the extra SIZE_SZ overhead as in mmap_chunk(). */
3294 new_size = (new_size + offset + SIZE_SZ + page_mask) & ~page_mask;
3296 cp = (char *)mremap((char *)p - offset, size + offset, new_size,
3297 MREMAP_MAYMOVE);
3299 if (cp == MAP_FAILED) return 0;
3301 p = (mchunkptr)(cp + offset);
3303 assert(aligned_OK(chunk2mem(p)));
3305 assert((p->prev_size == offset));
3306 set_head(p, (new_size - offset)|IS_MMAPPED);
3308 mp_.mmapped_mem -= size + offset;
3309 mp_.mmapped_mem += new_size;
3310 if ((unsigned long)mp_.mmapped_mem > (unsigned long)mp_.max_mmapped_mem)
3311 mp_.max_mmapped_mem = mp_.mmapped_mem;
3312 #ifdef NO_THREADS
3313 if ((unsigned long)(mp_.mmapped_mem + arena_mem + main_arena.system_mem) >
3314 mp_.max_total_mem)
3315 mp_.max_total_mem = mp_.mmapped_mem + arena_mem + main_arena.system_mem;
3316 #endif
3317 return p;
3320 #endif /* HAVE_MREMAP */
3322 #endif /* HAVE_MMAP */
3324 /*------------------------ Public wrappers. --------------------------------*/
3326 Void_t*
3327 public_mALLOc(size_t bytes)
3329 mstate ar_ptr;
3330 Void_t *victim;
3332 __malloc_ptr_t (*hook) (size_t, __const __malloc_ptr_t) = __malloc_hook;
3333 if (hook != NULL)
3334 return (*hook)(bytes, RETURN_ADDRESS (0));
3336 arena_get(ar_ptr, bytes);
3337 if(!ar_ptr)
3338 return 0;
3339 victim = _int_malloc(ar_ptr, bytes);
3340 if(!victim) {
3341 /* Maybe the failure is due to running out of mmapped areas. */
3342 if(ar_ptr != &main_arena) {
3343 (void)mutex_unlock(&ar_ptr->mutex);
3344 (void)mutex_lock(&main_arena.mutex);
3345 victim = _int_malloc(&main_arena, bytes);
3346 (void)mutex_unlock(&main_arena.mutex);
3347 } else {
3348 #if USE_ARENAS
3349 /* ... or sbrk() has failed and there is still a chance to mmap() */
3350 ar_ptr = arena_get2(ar_ptr->next ? ar_ptr : 0, bytes);
3351 (void)mutex_unlock(&main_arena.mutex);
3352 if(ar_ptr) {
3353 victim = _int_malloc(ar_ptr, bytes);
3354 (void)mutex_unlock(&ar_ptr->mutex);
3356 #endif
3358 } else
3359 (void)mutex_unlock(&ar_ptr->mutex);
3360 assert(!victim || chunk_is_mmapped(mem2chunk(victim)) ||
3361 ar_ptr == arena_for_chunk(mem2chunk(victim)));
3362 return victim;
3364 #ifdef libc_hidden_def
3365 libc_hidden_def(public_mALLOc)
3366 #endif
3368 void
3369 public_fREe(Void_t* mem)
3371 mstate ar_ptr;
3372 mchunkptr p; /* chunk corresponding to mem */
3374 void (*hook) (__malloc_ptr_t, __const __malloc_ptr_t) = __free_hook;
3375 if (hook != NULL) {
3376 (*hook)(mem, RETURN_ADDRESS (0));
3377 return;
3380 if (mem == 0) /* free(0) has no effect */
3381 return;
3383 p = mem2chunk(mem);
3385 #if HAVE_MMAP
3386 if (chunk_is_mmapped(p)) /* release mmapped memory. */
3388 munmap_chunk(p);
3389 return;
3391 #endif
3393 ar_ptr = arena_for_chunk(p);
3394 #if THREAD_STATS
3395 if(!mutex_trylock(&ar_ptr->mutex))
3396 ++(ar_ptr->stat_lock_direct);
3397 else {
3398 (void)mutex_lock(&ar_ptr->mutex);
3399 ++(ar_ptr->stat_lock_wait);
3401 #else
3402 (void)mutex_lock(&ar_ptr->mutex);
3403 #endif
3404 _int_free(ar_ptr, mem);
3405 (void)mutex_unlock(&ar_ptr->mutex);
3407 #ifdef libc_hidden_def
3408 libc_hidden_def (public_fREe)
3409 #endif
3411 Void_t*
3412 public_rEALLOc(Void_t* oldmem, size_t bytes)
3414 mstate ar_ptr;
3415 INTERNAL_SIZE_T nb; /* padded request size */
3417 mchunkptr oldp; /* chunk corresponding to oldmem */
3418 INTERNAL_SIZE_T oldsize; /* its size */
3420 Void_t* newp; /* chunk to return */
3422 __malloc_ptr_t (*hook) (__malloc_ptr_t, size_t, __const __malloc_ptr_t) =
3423 __realloc_hook;
3424 if (hook != NULL)
3425 return (*hook)(oldmem, bytes, RETURN_ADDRESS (0));
3427 #if REALLOC_ZERO_BYTES_FREES
3428 if (bytes == 0 && oldmem != NULL) { public_fREe(oldmem); return 0; }
3429 #endif
3431 /* realloc of null is supposed to be same as malloc */
3432 if (oldmem == 0) return public_mALLOc(bytes);
3434 oldp = mem2chunk(oldmem);
3435 oldsize = chunksize(oldp);
3437 /* Little security check which won't hurt performance: the
3438 allocator never wrapps around at the end of the address space.
3439 Therefore we can exclude some size values which might appear
3440 here by accident or by "design" from some intruder. */
3441 if (__builtin_expect ((uintptr_t) oldp > (uintptr_t) -oldsize, 0)
3442 || __builtin_expect ((uintptr_t) oldp & MALLOC_ALIGN_MASK, 0))
3444 malloc_printerr (check_action, "realloc(): invalid pointer", oldmem);
3445 return NULL;
3448 checked_request2size(bytes, nb);
3450 #if HAVE_MMAP
3451 if (chunk_is_mmapped(oldp))
3453 Void_t* newmem;
3455 #if HAVE_MREMAP
3456 newp = mremap_chunk(oldp, nb);
3457 if(newp) return chunk2mem(newp);
3458 #endif
3459 /* Note the extra SIZE_SZ overhead. */
3460 if(oldsize - SIZE_SZ >= nb) return oldmem; /* do nothing */
3461 /* Must alloc, copy, free. */
3462 newmem = public_mALLOc(bytes);
3463 if (newmem == 0) return 0; /* propagate failure */
3464 MALLOC_COPY(newmem, oldmem, oldsize - 2*SIZE_SZ);
3465 munmap_chunk(oldp);
3466 return newmem;
3468 #endif
3470 ar_ptr = arena_for_chunk(oldp);
3471 #if THREAD_STATS
3472 if(!mutex_trylock(&ar_ptr->mutex))
3473 ++(ar_ptr->stat_lock_direct);
3474 else {
3475 (void)mutex_lock(&ar_ptr->mutex);
3476 ++(ar_ptr->stat_lock_wait);
3478 #else
3479 (void)mutex_lock(&ar_ptr->mutex);
3480 #endif
3482 #ifndef NO_THREADS
3483 /* As in malloc(), remember this arena for the next allocation. */
3484 tsd_setspecific(arena_key, (Void_t *)ar_ptr);
3485 #endif
3487 newp = _int_realloc(ar_ptr, oldmem, bytes);
3489 (void)mutex_unlock(&ar_ptr->mutex);
3490 assert(!newp || chunk_is_mmapped(mem2chunk(newp)) ||
3491 ar_ptr == arena_for_chunk(mem2chunk(newp)));
3492 return newp;
3494 #ifdef libc_hidden_def
3495 libc_hidden_def (public_rEALLOc)
3496 #endif
3498 Void_t*
3499 public_mEMALIGn(size_t alignment, size_t bytes)
3501 mstate ar_ptr;
3502 Void_t *p;
3504 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3505 __const __malloc_ptr_t)) =
3506 __memalign_hook;
3507 if (hook != NULL)
3508 return (*hook)(alignment, bytes, RETURN_ADDRESS (0));
3510 /* If need less alignment than we give anyway, just relay to malloc */
3511 if (alignment <= MALLOC_ALIGNMENT) return public_mALLOc(bytes);
3513 /* Otherwise, ensure that it is at least a minimum chunk size */
3514 if (alignment < MINSIZE) alignment = MINSIZE;
3516 arena_get(ar_ptr, bytes + alignment + MINSIZE);
3517 if(!ar_ptr)
3518 return 0;
3519 p = _int_memalign(ar_ptr, alignment, bytes);
3520 (void)mutex_unlock(&ar_ptr->mutex);
3521 if(!p) {
3522 /* Maybe the failure is due to running out of mmapped areas. */
3523 if(ar_ptr != &main_arena) {
3524 (void)mutex_lock(&main_arena.mutex);
3525 p = _int_memalign(&main_arena, alignment, bytes);
3526 (void)mutex_unlock(&main_arena.mutex);
3527 } else {
3528 #if USE_ARENAS
3529 /* ... or sbrk() has failed and there is still a chance to mmap() */
3530 ar_ptr = arena_get2(ar_ptr->next ? ar_ptr : 0, bytes);
3531 if(ar_ptr) {
3532 p = _int_memalign(ar_ptr, alignment, bytes);
3533 (void)mutex_unlock(&ar_ptr->mutex);
3535 #endif
3538 assert(!p || chunk_is_mmapped(mem2chunk(p)) ||
3539 ar_ptr == arena_for_chunk(mem2chunk(p)));
3540 return p;
3542 #ifdef libc_hidden_def
3543 libc_hidden_def (public_mEMALIGn)
3544 #endif
3546 Void_t*
3547 public_vALLOc(size_t bytes)
3549 mstate ar_ptr;
3550 Void_t *p;
3552 if(__malloc_initialized < 0)
3553 ptmalloc_init ();
3555 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3556 __const __malloc_ptr_t)) =
3557 __memalign_hook;
3558 if (hook != NULL)
3559 return (*hook)(mp_.pagesize, bytes, RETURN_ADDRESS (0));
3561 arena_get(ar_ptr, bytes + mp_.pagesize + MINSIZE);
3562 if(!ar_ptr)
3563 return 0;
3564 p = _int_valloc(ar_ptr, bytes);
3565 (void)mutex_unlock(&ar_ptr->mutex);
3566 return p;
3569 Void_t*
3570 public_pVALLOc(size_t bytes)
3572 mstate ar_ptr;
3573 Void_t *p;
3575 if(__malloc_initialized < 0)
3576 ptmalloc_init ();
3578 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
3579 __const __malloc_ptr_t)) =
3580 __memalign_hook;
3581 if (hook != NULL)
3582 return (*hook)(mp_.pagesize,
3583 (bytes + mp_.pagesize - 1) & ~(mp_.pagesize - 1),
3584 RETURN_ADDRESS (0));
3586 arena_get(ar_ptr, bytes + 2*mp_.pagesize + MINSIZE);
3587 p = _int_pvalloc(ar_ptr, bytes);
3588 (void)mutex_unlock(&ar_ptr->mutex);
3589 return p;
3592 Void_t*
3593 public_cALLOc(size_t n, size_t elem_size)
3595 mstate av;
3596 mchunkptr oldtop, p;
3597 INTERNAL_SIZE_T bytes, sz, csz, oldtopsize;
3598 Void_t* mem;
3599 unsigned long clearsize;
3600 unsigned long nclears;
3601 INTERNAL_SIZE_T* d;
3602 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, __const __malloc_ptr_t)) =
3603 __malloc_hook;
3605 /* size_t is unsigned so the behavior on overflow is defined. */
3606 bytes = n * elem_size;
3607 #define HALF_INTERNAL_SIZE_T \
3608 (((INTERNAL_SIZE_T) 1) << (8 * sizeof (INTERNAL_SIZE_T) / 2))
3609 if (__builtin_expect ((n | elem_size) >= HALF_INTERNAL_SIZE_T, 0)) {
3610 if (elem_size != 0 && bytes / elem_size != n) {
3611 MALLOC_FAILURE_ACTION;
3612 return 0;
3616 if (hook != NULL) {
3617 sz = bytes;
3618 mem = (*hook)(sz, RETURN_ADDRESS (0));
3619 if(mem == 0)
3620 return 0;
3621 #ifdef HAVE_MEMCPY
3622 return memset(mem, 0, sz);
3623 #else
3624 while(sz > 0) ((char*)mem)[--sz] = 0; /* rather inefficient */
3625 return mem;
3626 #endif
3629 sz = bytes;
3631 arena_get(av, sz);
3632 if(!av)
3633 return 0;
3635 /* Check if we hand out the top chunk, in which case there may be no
3636 need to clear. */
3637 #if MORECORE_CLEARS
3638 oldtop = top(av);
3639 oldtopsize = chunksize(top(av));
3640 #if MORECORE_CLEARS < 2
3641 /* Only newly allocated memory is guaranteed to be cleared. */
3642 if (av == &main_arena &&
3643 oldtopsize < mp_.sbrk_base + av->max_system_mem - (char *)oldtop)
3644 oldtopsize = (mp_.sbrk_base + av->max_system_mem - (char *)oldtop);
3645 #endif
3646 #endif
3647 mem = _int_malloc(av, sz);
3649 /* Only clearing follows, so we can unlock early. */
3650 (void)mutex_unlock(&av->mutex);
3652 assert(!mem || chunk_is_mmapped(mem2chunk(mem)) ||
3653 av == arena_for_chunk(mem2chunk(mem)));
3655 if (mem == 0) {
3656 /* Maybe the failure is due to running out of mmapped areas. */
3657 if(av != &main_arena) {
3658 (void)mutex_lock(&main_arena.mutex);
3659 mem = _int_malloc(&main_arena, sz);
3660 (void)mutex_unlock(&main_arena.mutex);
3661 } else {
3662 #if USE_ARENAS
3663 /* ... or sbrk() has failed and there is still a chance to mmap() */
3664 (void)mutex_lock(&main_arena.mutex);
3665 av = arena_get2(av->next ? av : 0, sz);
3666 (void)mutex_unlock(&main_arena.mutex);
3667 if(av) {
3668 mem = _int_malloc(av, sz);
3669 (void)mutex_unlock(&av->mutex);
3671 #endif
3673 if (mem == 0) return 0;
3675 p = mem2chunk(mem);
3677 /* Two optional cases in which clearing not necessary */
3678 #if HAVE_MMAP
3679 if (chunk_is_mmapped(p))
3680 return mem;
3681 #endif
3683 csz = chunksize(p);
3685 #if MORECORE_CLEARS
3686 if (p == oldtop && csz > oldtopsize) {
3687 /* clear only the bytes from non-freshly-sbrked memory */
3688 csz = oldtopsize;
3690 #endif
3692 /* Unroll clear of <= 36 bytes (72 if 8byte sizes). We know that
3693 contents have an odd number of INTERNAL_SIZE_T-sized words;
3694 minimally 3. */
3695 d = (INTERNAL_SIZE_T*)mem;
3696 clearsize = csz - SIZE_SZ;
3697 nclears = clearsize / sizeof(INTERNAL_SIZE_T);
3698 assert(nclears >= 3);
3700 if (nclears > 9)
3701 MALLOC_ZERO(d, clearsize);
3703 else {
3704 *(d+0) = 0;
3705 *(d+1) = 0;
3706 *(d+2) = 0;
3707 if (nclears > 4) {
3708 *(d+3) = 0;
3709 *(d+4) = 0;
3710 if (nclears > 6) {
3711 *(d+5) = 0;
3712 *(d+6) = 0;
3713 if (nclears > 8) {
3714 *(d+7) = 0;
3715 *(d+8) = 0;
3721 return mem;
3724 Void_t**
3725 public_iCALLOc(size_t n, size_t elem_size, Void_t** chunks)
3727 mstate ar_ptr;
3728 Void_t** m;
3730 arena_get(ar_ptr, n*elem_size);
3731 if(!ar_ptr)
3732 return 0;
3734 m = _int_icalloc(ar_ptr, n, elem_size, chunks);
3735 (void)mutex_unlock(&ar_ptr->mutex);
3736 return m;
3739 Void_t**
3740 public_iCOMALLOc(size_t n, size_t sizes[], Void_t** chunks)
3742 mstate ar_ptr;
3743 Void_t** m;
3745 arena_get(ar_ptr, 0);
3746 if(!ar_ptr)
3747 return 0;
3749 m = _int_icomalloc(ar_ptr, n, sizes, chunks);
3750 (void)mutex_unlock(&ar_ptr->mutex);
3751 return m;
3754 #ifndef _LIBC
3756 void
3757 public_cFREe(Void_t* m)
3759 public_fREe(m);
3762 #endif /* _LIBC */
3765 public_mTRIm(size_t s)
3767 int result;
3769 if(__malloc_initialized < 0)
3770 ptmalloc_init ();
3771 (void)mutex_lock(&main_arena.mutex);
3772 result = mTRIm(s);
3773 (void)mutex_unlock(&main_arena.mutex);
3774 return result;
3777 size_t
3778 public_mUSABLe(Void_t* m)
3780 size_t result;
3782 result = mUSABLe(m);
3783 return result;
3786 void
3787 public_mSTATs()
3789 mSTATs();
3792 struct mallinfo public_mALLINFo()
3794 struct mallinfo m;
3796 if(__malloc_initialized < 0)
3797 ptmalloc_init ();
3798 (void)mutex_lock(&main_arena.mutex);
3799 m = mALLINFo(&main_arena);
3800 (void)mutex_unlock(&main_arena.mutex);
3801 return m;
3805 public_mALLOPt(int p, int v)
3807 int result;
3808 result = mALLOPt(p, v);
3809 return result;
3813 ------------------------------ malloc ------------------------------
3816 Void_t*
3817 _int_malloc(mstate av, size_t bytes)
3819 INTERNAL_SIZE_T nb; /* normalized request size */
3820 unsigned int idx; /* associated bin index */
3821 mbinptr bin; /* associated bin */
3822 mfastbinptr* fb; /* associated fastbin */
3824 mchunkptr victim; /* inspected/selected chunk */
3825 INTERNAL_SIZE_T size; /* its size */
3826 int victim_index; /* its bin index */
3828 mchunkptr remainder; /* remainder from a split */
3829 unsigned long remainder_size; /* its size */
3831 unsigned int block; /* bit map traverser */
3832 unsigned int bit; /* bit map traverser */
3833 unsigned int map; /* current word of binmap */
3835 mchunkptr fwd; /* misc temp for linking */
3836 mchunkptr bck; /* misc temp for linking */
3839 Convert request size to internal form by adding SIZE_SZ bytes
3840 overhead plus possibly more to obtain necessary alignment and/or
3841 to obtain a size of at least MINSIZE, the smallest allocatable
3842 size. Also, checked_request2size traps (returning 0) request sizes
3843 that are so large that they wrap around zero when padded and
3844 aligned.
3847 checked_request2size(bytes, nb);
3850 If the size qualifies as a fastbin, first check corresponding bin.
3851 This code is safe to execute even if av is not yet initialized, so we
3852 can try it without checking, which saves some time on this fast path.
3855 if ((unsigned long)(nb) <= (unsigned long)(av->max_fast)) {
3856 long int idx = fastbin_index(nb);
3857 fb = &(av->fastbins[idx]);
3858 if ( (victim = *fb) != 0) {
3859 if (__builtin_expect (fastbin_index (chunksize (victim)) != idx, 0))
3860 malloc_printerr (check_action, "malloc(): memory corruption (fast)",
3861 chunk2mem (victim));
3862 *fb = victim->fd;
3863 check_remalloced_chunk(av, victim, nb);
3864 return chunk2mem(victim);
3869 If a small request, check regular bin. Since these "smallbins"
3870 hold one size each, no searching within bins is necessary.
3871 (For a large request, we need to wait until unsorted chunks are
3872 processed to find best fit. But for small ones, fits are exact
3873 anyway, so we can check now, which is faster.)
3876 if (in_smallbin_range(nb)) {
3877 idx = smallbin_index(nb);
3878 bin = bin_at(av,idx);
3880 if ( (victim = last(bin)) != bin) {
3881 if (victim == 0) /* initialization check */
3882 malloc_consolidate(av);
3883 else {
3884 bck = victim->bk;
3885 set_inuse_bit_at_offset(victim, nb);
3886 bin->bk = bck;
3887 bck->fd = bin;
3889 if (av != &main_arena)
3890 victim->size |= NON_MAIN_ARENA;
3891 check_malloced_chunk(av, victim, nb);
3892 return chunk2mem(victim);
3898 If this is a large request, consolidate fastbins before continuing.
3899 While it might look excessive to kill all fastbins before
3900 even seeing if there is space available, this avoids
3901 fragmentation problems normally associated with fastbins.
3902 Also, in practice, programs tend to have runs of either small or
3903 large requests, but less often mixtures, so consolidation is not
3904 invoked all that often in most programs. And the programs that
3905 it is called frequently in otherwise tend to fragment.
3908 else {
3909 idx = largebin_index(nb);
3910 if (have_fastchunks(av))
3911 malloc_consolidate(av);
3915 Process recently freed or remaindered chunks, taking one only if
3916 it is exact fit, or, if this a small request, the chunk is remainder from
3917 the most recent non-exact fit. Place other traversed chunks in
3918 bins. Note that this step is the only place in any routine where
3919 chunks are placed in bins.
3921 The outer loop here is needed because we might not realize until
3922 near the end of malloc that we should have consolidated, so must
3923 do so and retry. This happens at most once, and only when we would
3924 otherwise need to expand memory to service a "small" request.
3927 for(;;) {
3929 while ( (victim = unsorted_chunks(av)->bk) != unsorted_chunks(av)) {
3930 bck = victim->bk;
3931 if (__builtin_expect (victim->size <= 2 * SIZE_SZ, 0)
3932 || __builtin_expect (victim->size > av->system_mem, 0))
3933 malloc_printerr (check_action, "malloc(): memory corruption",
3934 chunk2mem (victim));
3935 size = chunksize(victim);
3938 If a small request, try to use last remainder if it is the
3939 only chunk in unsorted bin. This helps promote locality for
3940 runs of consecutive small requests. This is the only
3941 exception to best-fit, and applies only when there is
3942 no exact fit for a small chunk.
3945 if (in_smallbin_range(nb) &&
3946 bck == unsorted_chunks(av) &&
3947 victim == av->last_remainder &&
3948 (unsigned long)(size) > (unsigned long)(nb + MINSIZE)) {
3950 /* split and reattach remainder */
3951 remainder_size = size - nb;
3952 remainder = chunk_at_offset(victim, nb);
3953 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
3954 av->last_remainder = remainder;
3955 remainder->bk = remainder->fd = unsorted_chunks(av);
3957 set_head(victim, nb | PREV_INUSE |
3958 (av != &main_arena ? NON_MAIN_ARENA : 0));
3959 set_head(remainder, remainder_size | PREV_INUSE);
3960 set_foot(remainder, remainder_size);
3962 check_malloced_chunk(av, victim, nb);
3963 return chunk2mem(victim);
3966 /* remove from unsorted list */
3967 unsorted_chunks(av)->bk = bck;
3968 bck->fd = unsorted_chunks(av);
3970 /* Take now instead of binning if exact fit */
3972 if (size == nb) {
3973 set_inuse_bit_at_offset(victim, size);
3974 if (av != &main_arena)
3975 victim->size |= NON_MAIN_ARENA;
3976 check_malloced_chunk(av, victim, nb);
3977 return chunk2mem(victim);
3980 /* place chunk in bin */
3982 if (in_smallbin_range(size)) {
3983 victim_index = smallbin_index(size);
3984 bck = bin_at(av, victim_index);
3985 fwd = bck->fd;
3987 else {
3988 victim_index = largebin_index(size);
3989 bck = bin_at(av, victim_index);
3990 fwd = bck->fd;
3992 /* maintain large bins in sorted order */
3993 if (fwd != bck) {
3994 /* Or with inuse bit to speed comparisons */
3995 size |= PREV_INUSE;
3996 /* if smaller than smallest, bypass loop below */
3997 assert((bck->bk->size & NON_MAIN_ARENA) == 0);
3998 if ((unsigned long)(size) <= (unsigned long)(bck->bk->size)) {
3999 fwd = bck;
4000 bck = bck->bk;
4002 else {
4003 assert((fwd->size & NON_MAIN_ARENA) == 0);
4004 while ((unsigned long)(size) < (unsigned long)(fwd->size)) {
4005 fwd = fwd->fd;
4006 assert((fwd->size & NON_MAIN_ARENA) == 0);
4008 bck = fwd->bk;
4013 mark_bin(av, victim_index);
4014 victim->bk = bck;
4015 victim->fd = fwd;
4016 fwd->bk = victim;
4017 bck->fd = victim;
4021 If a large request, scan through the chunks of current bin in
4022 sorted order to find smallest that fits. This is the only step
4023 where an unbounded number of chunks might be scanned without doing
4024 anything useful with them. However the lists tend to be short.
4027 if (!in_smallbin_range(nb)) {
4028 bin = bin_at(av, idx);
4030 /* skip scan if empty or largest chunk is too small */
4031 if ((victim = last(bin)) != bin &&
4032 (unsigned long)(first(bin)->size) >= (unsigned long)(nb)) {
4034 while (((unsigned long)(size = chunksize(victim)) <
4035 (unsigned long)(nb)))
4036 victim = victim->bk;
4038 remainder_size = size - nb;
4039 unlink(victim, bck, fwd);
4041 /* Exhaust */
4042 if (remainder_size < MINSIZE) {
4043 set_inuse_bit_at_offset(victim, size);
4044 if (av != &main_arena)
4045 victim->size |= NON_MAIN_ARENA;
4046 check_malloced_chunk(av, victim, nb);
4047 return chunk2mem(victim);
4049 /* Split */
4050 else {
4051 remainder = chunk_at_offset(victim, nb);
4052 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
4053 remainder->bk = remainder->fd = unsorted_chunks(av);
4054 set_head(victim, nb | PREV_INUSE |
4055 (av != &main_arena ? NON_MAIN_ARENA : 0));
4056 set_head(remainder, remainder_size | PREV_INUSE);
4057 set_foot(remainder, remainder_size);
4058 check_malloced_chunk(av, victim, nb);
4059 return chunk2mem(victim);
4065 Search for a chunk by scanning bins, starting with next largest
4066 bin. This search is strictly by best-fit; i.e., the smallest
4067 (with ties going to approximately the least recently used) chunk
4068 that fits is selected.
4070 The bitmap avoids needing to check that most blocks are nonempty.
4071 The particular case of skipping all bins during warm-up phases
4072 when no chunks have been returned yet is faster than it might look.
4075 ++idx;
4076 bin = bin_at(av,idx);
4077 block = idx2block(idx);
4078 map = av->binmap[block];
4079 bit = idx2bit(idx);
4081 for (;;) {
4083 /* Skip rest of block if there are no more set bits in this block. */
4084 if (bit > map || bit == 0) {
4085 do {
4086 if (++block >= BINMAPSIZE) /* out of bins */
4087 goto use_top;
4088 } while ( (map = av->binmap[block]) == 0);
4090 bin = bin_at(av, (block << BINMAPSHIFT));
4091 bit = 1;
4094 /* Advance to bin with set bit. There must be one. */
4095 while ((bit & map) == 0) {
4096 bin = next_bin(bin);
4097 bit <<= 1;
4098 assert(bit != 0);
4101 /* Inspect the bin. It is likely to be non-empty */
4102 victim = last(bin);
4104 /* If a false alarm (empty bin), clear the bit. */
4105 if (victim == bin) {
4106 av->binmap[block] = map &= ~bit; /* Write through */
4107 bin = next_bin(bin);
4108 bit <<= 1;
4111 else {
4112 size = chunksize(victim);
4114 /* We know the first chunk in this bin is big enough to use. */
4115 assert((unsigned long)(size) >= (unsigned long)(nb));
4117 remainder_size = size - nb;
4119 /* unlink */
4120 bck = victim->bk;
4121 bin->bk = bck;
4122 bck->fd = bin;
4124 /* Exhaust */
4125 if (remainder_size < MINSIZE) {
4126 set_inuse_bit_at_offset(victim, size);
4127 if (av != &main_arena)
4128 victim->size |= NON_MAIN_ARENA;
4129 check_malloced_chunk(av, victim, nb);
4130 return chunk2mem(victim);
4133 /* Split */
4134 else {
4135 remainder = chunk_at_offset(victim, nb);
4137 unsorted_chunks(av)->bk = unsorted_chunks(av)->fd = remainder;
4138 remainder->bk = remainder->fd = unsorted_chunks(av);
4139 /* advertise as last remainder */
4140 if (in_smallbin_range(nb))
4141 av->last_remainder = remainder;
4143 set_head(victim, nb | PREV_INUSE |
4144 (av != &main_arena ? NON_MAIN_ARENA : 0));
4145 set_head(remainder, remainder_size | PREV_INUSE);
4146 set_foot(remainder, remainder_size);
4147 check_malloced_chunk(av, victim, nb);
4148 return chunk2mem(victim);
4153 use_top:
4155 If large enough, split off the chunk bordering the end of memory
4156 (held in av->top). Note that this is in accord with the best-fit
4157 search rule. In effect, av->top is treated as larger (and thus
4158 less well fitting) than any other available chunk since it can
4159 be extended to be as large as necessary (up to system
4160 limitations).
4162 We require that av->top always exists (i.e., has size >=
4163 MINSIZE) after initialization, so if it would otherwise be
4164 exhuasted by current request, it is replenished. (The main
4165 reason for ensuring it exists is that we may need MINSIZE space
4166 to put in fenceposts in sysmalloc.)
4169 victim = av->top;
4170 size = chunksize(victim);
4172 if ((unsigned long)(size) >= (unsigned long)(nb + MINSIZE)) {
4173 remainder_size = size - nb;
4174 remainder = chunk_at_offset(victim, nb);
4175 av->top = remainder;
4176 set_head(victim, nb | PREV_INUSE |
4177 (av != &main_arena ? NON_MAIN_ARENA : 0));
4178 set_head(remainder, remainder_size | PREV_INUSE);
4180 check_malloced_chunk(av, victim, nb);
4181 return chunk2mem(victim);
4185 If there is space available in fastbins, consolidate and retry,
4186 to possibly avoid expanding memory. This can occur only if nb is
4187 in smallbin range so we didn't consolidate upon entry.
4190 else if (have_fastchunks(av)) {
4191 assert(in_smallbin_range(nb));
4192 malloc_consolidate(av);
4193 idx = smallbin_index(nb); /* restore original bin index */
4197 Otherwise, relay to handle system-dependent cases
4199 else
4200 return sYSMALLOc(nb, av);
4205 ------------------------------ free ------------------------------
4208 void
4209 _int_free(mstate av, Void_t* mem)
4211 mchunkptr p; /* chunk corresponding to mem */
4212 INTERNAL_SIZE_T size; /* its size */
4213 mfastbinptr* fb; /* associated fastbin */
4214 mchunkptr nextchunk; /* next contiguous chunk */
4215 INTERNAL_SIZE_T nextsize; /* its size */
4216 int nextinuse; /* true if nextchunk is used */
4217 INTERNAL_SIZE_T prevsize; /* size of previous contiguous chunk */
4218 mchunkptr bck; /* misc temp for linking */
4219 mchunkptr fwd; /* misc temp for linking */
4221 const char *errstr = NULL;
4223 p = mem2chunk(mem);
4224 size = chunksize(p);
4226 /* Little security check which won't hurt performance: the
4227 allocator never wrapps around at the end of the address space.
4228 Therefore we can exclude some size values which might appear
4229 here by accident or by "design" from some intruder. */
4230 if (__builtin_expect ((uintptr_t) p > (uintptr_t) -size, 0)
4231 || __builtin_expect ((uintptr_t) p & MALLOC_ALIGN_MASK, 0))
4233 errstr = "free(): invalid pointer";
4234 errout:
4235 malloc_printerr (check_action, errstr, mem);
4236 return;
4239 check_inuse_chunk(av, p);
4242 If eligible, place chunk on a fastbin so it can be found
4243 and used quickly in malloc.
4246 if ((unsigned long)(size) <= (unsigned long)(av->max_fast)
4248 #if TRIM_FASTBINS
4250 If TRIM_FASTBINS set, don't place chunks
4251 bordering top into fastbins
4253 && (chunk_at_offset(p, size) != av->top)
4254 #endif
4257 if (__builtin_expect (chunk_at_offset (p, size)->size <= 2 * SIZE_SZ, 0)
4258 || __builtin_expect (chunksize (chunk_at_offset (p, size))
4259 >= av->system_mem, 0))
4261 errstr = "free(): invalid next size (fast)";
4262 goto errout;
4265 set_fastchunks(av);
4266 fb = &(av->fastbins[fastbin_index(size)]);
4267 /* Another simple check: make sure the top of the bin is not the
4268 record we are going to add (i.e., double free). */
4269 if (__builtin_expect (*fb == p, 0))
4271 errstr = "double free or corruption (fasttop)";
4272 goto errout;
4274 p->fd = *fb;
4275 *fb = p;
4279 Consolidate other non-mmapped chunks as they arrive.
4282 else if (!chunk_is_mmapped(p)) {
4283 nextchunk = chunk_at_offset(p, size);
4285 /* Lightweight tests: check whether the block is already the
4286 top block. */
4287 if (__builtin_expect (p == av->top, 0))
4289 errstr = "double free or corruption (top)";
4290 goto errout;
4292 /* Or whether the next chunk is beyond the boundaries of the arena. */
4293 if (__builtin_expect (contiguous (av)
4294 && (char *) nextchunk
4295 >= ((char *) av->top + chunksize(av->top)), 0))
4297 errstr = "double free or corruption (out)";
4298 goto errout;
4300 /* Or whether the block is actually not marked used. */
4301 if (__builtin_expect (!prev_inuse(nextchunk), 0))
4303 errstr = "double free or corruption (!prev)";
4304 goto errout;
4307 nextsize = chunksize(nextchunk);
4308 if (__builtin_expect (nextchunk->size <= 2 * SIZE_SZ, 0)
4309 || __builtin_expect (nextsize >= av->system_mem, 0))
4311 errstr = "free(): invalid next size (normal)";
4312 goto errout;
4315 /* consolidate backward */
4316 if (!prev_inuse(p)) {
4317 prevsize = p->prev_size;
4318 size += prevsize;
4319 p = chunk_at_offset(p, -((long) prevsize));
4320 unlink(p, bck, fwd);
4323 if (nextchunk != av->top) {
4324 /* get and clear inuse bit */
4325 nextinuse = inuse_bit_at_offset(nextchunk, nextsize);
4327 /* consolidate forward */
4328 if (!nextinuse) {
4329 unlink(nextchunk, bck, fwd);
4330 size += nextsize;
4331 } else
4332 clear_inuse_bit_at_offset(nextchunk, 0);
4335 Place the chunk in unsorted chunk list. Chunks are
4336 not placed into regular bins until after they have
4337 been given one chance to be used in malloc.
4340 bck = unsorted_chunks(av);
4341 fwd = bck->fd;
4342 p->bk = bck;
4343 p->fd = fwd;
4344 bck->fd = p;
4345 fwd->bk = p;
4347 set_head(p, size | PREV_INUSE);
4348 set_foot(p, size);
4350 check_free_chunk(av, p);
4354 If the chunk borders the current high end of memory,
4355 consolidate into top
4358 else {
4359 size += nextsize;
4360 set_head(p, size | PREV_INUSE);
4361 av->top = p;
4362 check_chunk(av, p);
4366 If freeing a large space, consolidate possibly-surrounding
4367 chunks. Then, if the total unused topmost memory exceeds trim
4368 threshold, ask malloc_trim to reduce top.
4370 Unless max_fast is 0, we don't know if there are fastbins
4371 bordering top, so we cannot tell for sure whether threshold
4372 has been reached unless fastbins are consolidated. But we
4373 don't want to consolidate on each free. As a compromise,
4374 consolidation is performed if FASTBIN_CONSOLIDATION_THRESHOLD
4375 is reached.
4378 if ((unsigned long)(size) >= FASTBIN_CONSOLIDATION_THRESHOLD) {
4379 if (have_fastchunks(av))
4380 malloc_consolidate(av);
4382 if (av == &main_arena) {
4383 #ifndef MORECORE_CANNOT_TRIM
4384 if ((unsigned long)(chunksize(av->top)) >=
4385 (unsigned long)(mp_.trim_threshold))
4386 sYSTRIm(mp_.top_pad, av);
4387 #endif
4388 } else {
4389 /* Always try heap_trim(), even if the top chunk is not
4390 large, because the corresponding heap might go away. */
4391 heap_info *heap = heap_for_ptr(top(av));
4393 assert(heap->ar_ptr == av);
4394 heap_trim(heap, mp_.top_pad);
4400 If the chunk was allocated via mmap, release via munmap(). Note
4401 that if HAVE_MMAP is false but chunk_is_mmapped is true, then
4402 user must have overwritten memory. There's nothing we can do to
4403 catch this error unless MALLOC_DEBUG is set, in which case
4404 check_inuse_chunk (above) will have triggered error.
4407 else {
4408 #if HAVE_MMAP
4409 munmap_chunk (p);
4410 #endif
4415 ------------------------- malloc_consolidate -------------------------
4417 malloc_consolidate is a specialized version of free() that tears
4418 down chunks held in fastbins. Free itself cannot be used for this
4419 purpose since, among other things, it might place chunks back onto
4420 fastbins. So, instead, we need to use a minor variant of the same
4421 code.
4423 Also, because this routine needs to be called the first time through
4424 malloc anyway, it turns out to be the perfect place to trigger
4425 initialization code.
4428 #if __STD_C
4429 static void malloc_consolidate(mstate av)
4430 #else
4431 static void malloc_consolidate(av) mstate av;
4432 #endif
4434 mfastbinptr* fb; /* current fastbin being consolidated */
4435 mfastbinptr* maxfb; /* last fastbin (for loop control) */
4436 mchunkptr p; /* current chunk being consolidated */
4437 mchunkptr nextp; /* next chunk to consolidate */
4438 mchunkptr unsorted_bin; /* bin header */
4439 mchunkptr first_unsorted; /* chunk to link to */
4441 /* These have same use as in free() */
4442 mchunkptr nextchunk;
4443 INTERNAL_SIZE_T size;
4444 INTERNAL_SIZE_T nextsize;
4445 INTERNAL_SIZE_T prevsize;
4446 int nextinuse;
4447 mchunkptr bck;
4448 mchunkptr fwd;
4451 If max_fast is 0, we know that av hasn't
4452 yet been initialized, in which case do so below
4455 if (av->max_fast != 0) {
4456 clear_fastchunks(av);
4458 unsorted_bin = unsorted_chunks(av);
4461 Remove each chunk from fast bin and consolidate it, placing it
4462 then in unsorted bin. Among other reasons for doing this,
4463 placing in unsorted bin avoids needing to calculate actual bins
4464 until malloc is sure that chunks aren't immediately going to be
4465 reused anyway.
4468 maxfb = &(av->fastbins[fastbin_index(av->max_fast)]);
4469 fb = &(av->fastbins[0]);
4470 do {
4471 if ( (p = *fb) != 0) {
4472 *fb = 0;
4474 do {
4475 check_inuse_chunk(av, p);
4476 nextp = p->fd;
4478 /* Slightly streamlined version of consolidation code in free() */
4479 size = p->size & ~(PREV_INUSE|NON_MAIN_ARENA);
4480 nextchunk = chunk_at_offset(p, size);
4481 nextsize = chunksize(nextchunk);
4483 if (!prev_inuse(p)) {
4484 prevsize = p->prev_size;
4485 size += prevsize;
4486 p = chunk_at_offset(p, -((long) prevsize));
4487 unlink(p, bck, fwd);
4490 if (nextchunk != av->top) {
4491 nextinuse = inuse_bit_at_offset(nextchunk, nextsize);
4493 if (!nextinuse) {
4494 size += nextsize;
4495 unlink(nextchunk, bck, fwd);
4496 } else
4497 clear_inuse_bit_at_offset(nextchunk, 0);
4499 first_unsorted = unsorted_bin->fd;
4500 unsorted_bin->fd = p;
4501 first_unsorted->bk = p;
4503 set_head(p, size | PREV_INUSE);
4504 p->bk = unsorted_bin;
4505 p->fd = first_unsorted;
4506 set_foot(p, size);
4509 else {
4510 size += nextsize;
4511 set_head(p, size | PREV_INUSE);
4512 av->top = p;
4515 } while ( (p = nextp) != 0);
4518 } while (fb++ != maxfb);
4520 else {
4521 malloc_init_state(av);
4522 check_malloc_state(av);
4527 ------------------------------ realloc ------------------------------
4530 Void_t*
4531 _int_realloc(mstate av, Void_t* oldmem, size_t bytes)
4533 INTERNAL_SIZE_T nb; /* padded request size */
4535 mchunkptr oldp; /* chunk corresponding to oldmem */
4536 INTERNAL_SIZE_T oldsize; /* its size */
4538 mchunkptr newp; /* chunk to return */
4539 INTERNAL_SIZE_T newsize; /* its size */
4540 Void_t* newmem; /* corresponding user mem */
4542 mchunkptr next; /* next contiguous chunk after oldp */
4544 mchunkptr remainder; /* extra space at end of newp */
4545 unsigned long remainder_size; /* its size */
4547 mchunkptr bck; /* misc temp for linking */
4548 mchunkptr fwd; /* misc temp for linking */
4550 unsigned long copysize; /* bytes to copy */
4551 unsigned int ncopies; /* INTERNAL_SIZE_T words to copy */
4552 INTERNAL_SIZE_T* s; /* copy source */
4553 INTERNAL_SIZE_T* d; /* copy destination */
4555 const char *errstr = NULL;
4558 checked_request2size(bytes, nb);
4560 oldp = mem2chunk(oldmem);
4561 oldsize = chunksize(oldp);
4563 /* Simple tests for old block integrity. */
4564 if (__builtin_expect ((uintptr_t) oldp & MALLOC_ALIGN_MASK, 0))
4566 errstr = "realloc(): invalid pointer";
4567 errout:
4568 malloc_printerr (check_action, errstr, oldmem);
4569 return NULL;
4571 if (__builtin_expect (oldp->size <= 2 * SIZE_SZ, 0)
4572 || __builtin_expect (oldsize >= av->system_mem, 0))
4574 errstr = "realloc(): invalid size";
4575 goto errout;
4578 check_inuse_chunk(av, oldp);
4580 if (!chunk_is_mmapped(oldp)) {
4582 next = chunk_at_offset(oldp, oldsize);
4583 INTERNAL_SIZE_T nextsize = chunksize(next);
4584 if (__builtin_expect (next->size <= 2 * SIZE_SZ, 0)
4585 || __builtin_expect (nextsize >= av->system_mem, 0))
4587 errstr = "realloc(): invalid next size";
4588 goto errout;
4591 if ((unsigned long)(oldsize) >= (unsigned long)(nb)) {
4592 /* already big enough; split below */
4593 newp = oldp;
4594 newsize = oldsize;
4597 else {
4598 /* Try to expand forward into top */
4599 if (next == av->top &&
4600 (unsigned long)(newsize = oldsize + nextsize) >=
4601 (unsigned long)(nb + MINSIZE)) {
4602 set_head_size(oldp, nb | (av != &main_arena ? NON_MAIN_ARENA : 0));
4603 av->top = chunk_at_offset(oldp, nb);
4604 set_head(av->top, (newsize - nb) | PREV_INUSE);
4605 check_inuse_chunk(av, oldp);
4606 return chunk2mem(oldp);
4609 /* Try to expand forward into next chunk; split off remainder below */
4610 else if (next != av->top &&
4611 !inuse(next) &&
4612 (unsigned long)(newsize = oldsize + nextsize) >=
4613 (unsigned long)(nb)) {
4614 newp = oldp;
4615 unlink(next, bck, fwd);
4618 /* allocate, copy, free */
4619 else {
4620 newmem = _int_malloc(av, nb - MALLOC_ALIGN_MASK);
4621 if (newmem == 0)
4622 return 0; /* propagate failure */
4624 newp = mem2chunk(newmem);
4625 newsize = chunksize(newp);
4628 Avoid copy if newp is next chunk after oldp.
4630 if (newp == next) {
4631 newsize += oldsize;
4632 newp = oldp;
4634 else {
4636 Unroll copy of <= 36 bytes (72 if 8byte sizes)
4637 We know that contents have an odd number of
4638 INTERNAL_SIZE_T-sized words; minimally 3.
4641 copysize = oldsize - SIZE_SZ;
4642 s = (INTERNAL_SIZE_T*)(oldmem);
4643 d = (INTERNAL_SIZE_T*)(newmem);
4644 ncopies = copysize / sizeof(INTERNAL_SIZE_T);
4645 assert(ncopies >= 3);
4647 if (ncopies > 9)
4648 MALLOC_COPY(d, s, copysize);
4650 else {
4651 *(d+0) = *(s+0);
4652 *(d+1) = *(s+1);
4653 *(d+2) = *(s+2);
4654 if (ncopies > 4) {
4655 *(d+3) = *(s+3);
4656 *(d+4) = *(s+4);
4657 if (ncopies > 6) {
4658 *(d+5) = *(s+5);
4659 *(d+6) = *(s+6);
4660 if (ncopies > 8) {
4661 *(d+7) = *(s+7);
4662 *(d+8) = *(s+8);
4668 _int_free(av, oldmem);
4669 check_inuse_chunk(av, newp);
4670 return chunk2mem(newp);
4675 /* If possible, free extra space in old or extended chunk */
4677 assert((unsigned long)(newsize) >= (unsigned long)(nb));
4679 remainder_size = newsize - nb;
4681 if (remainder_size < MINSIZE) { /* not enough extra to split off */
4682 set_head_size(newp, newsize | (av != &main_arena ? NON_MAIN_ARENA : 0));
4683 set_inuse_bit_at_offset(newp, newsize);
4685 else { /* split remainder */
4686 remainder = chunk_at_offset(newp, nb);
4687 set_head_size(newp, nb | (av != &main_arena ? NON_MAIN_ARENA : 0));
4688 set_head(remainder, remainder_size | PREV_INUSE |
4689 (av != &main_arena ? NON_MAIN_ARENA : 0));
4690 /* Mark remainder as inuse so free() won't complain */
4691 set_inuse_bit_at_offset(remainder, remainder_size);
4692 _int_free(av, chunk2mem(remainder));
4695 check_inuse_chunk(av, newp);
4696 return chunk2mem(newp);
4700 Handle mmap cases
4703 else {
4704 #if HAVE_MMAP
4706 #if HAVE_MREMAP
4707 INTERNAL_SIZE_T offset = oldp->prev_size;
4708 size_t pagemask = mp_.pagesize - 1;
4709 char *cp;
4710 unsigned long sum;
4712 /* Note the extra SIZE_SZ overhead */
4713 newsize = (nb + offset + SIZE_SZ + pagemask) & ~pagemask;
4715 /* don't need to remap if still within same page */
4716 if (oldsize == newsize - offset)
4717 return oldmem;
4719 cp = (char*)mremap((char*)oldp - offset, oldsize + offset, newsize, 1);
4721 if (cp != MAP_FAILED) {
4723 newp = (mchunkptr)(cp + offset);
4724 set_head(newp, (newsize - offset)|IS_MMAPPED);
4726 assert(aligned_OK(chunk2mem(newp)));
4727 assert((newp->prev_size == offset));
4729 /* update statistics */
4730 sum = mp_.mmapped_mem += newsize - oldsize;
4731 if (sum > (unsigned long)(mp_.max_mmapped_mem))
4732 mp_.max_mmapped_mem = sum;
4733 #ifdef NO_THREADS
4734 sum += main_arena.system_mem;
4735 if (sum > (unsigned long)(mp_.max_total_mem))
4736 mp_.max_total_mem = sum;
4737 #endif
4739 return chunk2mem(newp);
4741 #endif
4743 /* Note the extra SIZE_SZ overhead. */
4744 if ((unsigned long)(oldsize) >= (unsigned long)(nb + SIZE_SZ))
4745 newmem = oldmem; /* do nothing */
4746 else {
4747 /* Must alloc, copy, free. */
4748 newmem = _int_malloc(av, nb - MALLOC_ALIGN_MASK);
4749 if (newmem != 0) {
4750 MALLOC_COPY(newmem, oldmem, oldsize - 2*SIZE_SZ);
4751 _int_free(av, oldmem);
4754 return newmem;
4756 #else
4757 /* If !HAVE_MMAP, but chunk_is_mmapped, user must have overwritten mem */
4758 check_malloc_state(av);
4759 MALLOC_FAILURE_ACTION;
4760 return 0;
4761 #endif
4766 ------------------------------ memalign ------------------------------
4769 Void_t*
4770 _int_memalign(mstate av, size_t alignment, size_t bytes)
4772 INTERNAL_SIZE_T nb; /* padded request size */
4773 char* m; /* memory returned by malloc call */
4774 mchunkptr p; /* corresponding chunk */
4775 char* brk; /* alignment point within p */
4776 mchunkptr newp; /* chunk to return */
4777 INTERNAL_SIZE_T newsize; /* its size */
4778 INTERNAL_SIZE_T leadsize; /* leading space before alignment point */
4779 mchunkptr remainder; /* spare room at end to split off */
4780 unsigned long remainder_size; /* its size */
4781 INTERNAL_SIZE_T size;
4783 /* If need less alignment than we give anyway, just relay to malloc */
4785 if (alignment <= MALLOC_ALIGNMENT) return _int_malloc(av, bytes);
4787 /* Otherwise, ensure that it is at least a minimum chunk size */
4789 if (alignment < MINSIZE) alignment = MINSIZE;
4791 /* Make sure alignment is power of 2 (in case MINSIZE is not). */
4792 if ((alignment & (alignment - 1)) != 0) {
4793 size_t a = MALLOC_ALIGNMENT * 2;
4794 while ((unsigned long)a < (unsigned long)alignment) a <<= 1;
4795 alignment = a;
4798 checked_request2size(bytes, nb);
4801 Strategy: find a spot within that chunk that meets the alignment
4802 request, and then possibly free the leading and trailing space.
4806 /* Call malloc with worst case padding to hit alignment. */
4808 m = (char*)(_int_malloc(av, nb + alignment + MINSIZE));
4810 if (m == 0) return 0; /* propagate failure */
4812 p = mem2chunk(m);
4814 if ((((unsigned long)(m)) % alignment) != 0) { /* misaligned */
4817 Find an aligned spot inside chunk. Since we need to give back
4818 leading space in a chunk of at least MINSIZE, if the first
4819 calculation places us at a spot with less than MINSIZE leader,
4820 we can move to the next aligned spot -- we've allocated enough
4821 total room so that this is always possible.
4824 brk = (char*)mem2chunk(((unsigned long)(m + alignment - 1)) &
4825 -((signed long) alignment));
4826 if ((unsigned long)(brk - (char*)(p)) < MINSIZE)
4827 brk += alignment;
4829 newp = (mchunkptr)brk;
4830 leadsize = brk - (char*)(p);
4831 newsize = chunksize(p) - leadsize;
4833 /* For mmapped chunks, just adjust offset */
4834 if (chunk_is_mmapped(p)) {
4835 newp->prev_size = p->prev_size + leadsize;
4836 set_head(newp, newsize|IS_MMAPPED);
4837 return chunk2mem(newp);
4840 /* Otherwise, give back leader, use the rest */
4841 set_head(newp, newsize | PREV_INUSE |
4842 (av != &main_arena ? NON_MAIN_ARENA : 0));
4843 set_inuse_bit_at_offset(newp, newsize);
4844 set_head_size(p, leadsize | (av != &main_arena ? NON_MAIN_ARENA : 0));
4845 _int_free(av, chunk2mem(p));
4846 p = newp;
4848 assert (newsize >= nb &&
4849 (((unsigned long)(chunk2mem(p))) % alignment) == 0);
4852 /* Also give back spare room at the end */
4853 if (!chunk_is_mmapped(p)) {
4854 size = chunksize(p);
4855 if ((unsigned long)(size) > (unsigned long)(nb + MINSIZE)) {
4856 remainder_size = size - nb;
4857 remainder = chunk_at_offset(p, nb);
4858 set_head(remainder, remainder_size | PREV_INUSE |
4859 (av != &main_arena ? NON_MAIN_ARENA : 0));
4860 set_head_size(p, nb);
4861 _int_free(av, chunk2mem(remainder));
4865 check_inuse_chunk(av, p);
4866 return chunk2mem(p);
4869 #if 0
4871 ------------------------------ calloc ------------------------------
4874 #if __STD_C
4875 Void_t* cALLOc(size_t n_elements, size_t elem_size)
4876 #else
4877 Void_t* cALLOc(n_elements, elem_size) size_t n_elements; size_t elem_size;
4878 #endif
4880 mchunkptr p;
4881 unsigned long clearsize;
4882 unsigned long nclears;
4883 INTERNAL_SIZE_T* d;
4885 Void_t* mem = mALLOc(n_elements * elem_size);
4887 if (mem != 0) {
4888 p = mem2chunk(mem);
4890 #if MMAP_CLEARS
4891 if (!chunk_is_mmapped(p)) /* don't need to clear mmapped space */
4892 #endif
4895 Unroll clear of <= 36 bytes (72 if 8byte sizes)
4896 We know that contents have an odd number of
4897 INTERNAL_SIZE_T-sized words; minimally 3.
4900 d = (INTERNAL_SIZE_T*)mem;
4901 clearsize = chunksize(p) - SIZE_SZ;
4902 nclears = clearsize / sizeof(INTERNAL_SIZE_T);
4903 assert(nclears >= 3);
4905 if (nclears > 9)
4906 MALLOC_ZERO(d, clearsize);
4908 else {
4909 *(d+0) = 0;
4910 *(d+1) = 0;
4911 *(d+2) = 0;
4912 if (nclears > 4) {
4913 *(d+3) = 0;
4914 *(d+4) = 0;
4915 if (nclears > 6) {
4916 *(d+5) = 0;
4917 *(d+6) = 0;
4918 if (nclears > 8) {
4919 *(d+7) = 0;
4920 *(d+8) = 0;
4927 return mem;
4929 #endif /* 0 */
4932 ------------------------- independent_calloc -------------------------
4935 Void_t**
4936 #if __STD_C
4937 _int_icalloc(mstate av, size_t n_elements, size_t elem_size, Void_t* chunks[])
4938 #else
4939 _int_icalloc(av, n_elements, elem_size, chunks)
4940 mstate av; size_t n_elements; size_t elem_size; Void_t* chunks[];
4941 #endif
4943 size_t sz = elem_size; /* serves as 1-element array */
4944 /* opts arg of 3 means all elements are same size, and should be cleared */
4945 return iALLOc(av, n_elements, &sz, 3, chunks);
4949 ------------------------- independent_comalloc -------------------------
4952 Void_t**
4953 #if __STD_C
4954 _int_icomalloc(mstate av, size_t n_elements, size_t sizes[], Void_t* chunks[])
4955 #else
4956 _int_icomalloc(av, n_elements, sizes, chunks)
4957 mstate av; size_t n_elements; size_t sizes[]; Void_t* chunks[];
4958 #endif
4960 return iALLOc(av, n_elements, sizes, 0, chunks);
4965 ------------------------------ ialloc ------------------------------
4966 ialloc provides common support for independent_X routines, handling all of
4967 the combinations that can result.
4969 The opts arg has:
4970 bit 0 set if all elements are same size (using sizes[0])
4971 bit 1 set if elements should be zeroed
4975 static Void_t**
4976 #if __STD_C
4977 iALLOc(mstate av, size_t n_elements, size_t* sizes, int opts, Void_t* chunks[])
4978 #else
4979 iALLOc(av, n_elements, sizes, opts, chunks)
4980 mstate av; size_t n_elements; size_t* sizes; int opts; Void_t* chunks[];
4981 #endif
4983 INTERNAL_SIZE_T element_size; /* chunksize of each element, if all same */
4984 INTERNAL_SIZE_T contents_size; /* total size of elements */
4985 INTERNAL_SIZE_T array_size; /* request size of pointer array */
4986 Void_t* mem; /* malloced aggregate space */
4987 mchunkptr p; /* corresponding chunk */
4988 INTERNAL_SIZE_T remainder_size; /* remaining bytes while splitting */
4989 Void_t** marray; /* either "chunks" or malloced ptr array */
4990 mchunkptr array_chunk; /* chunk for malloced ptr array */
4991 int mmx; /* to disable mmap */
4992 INTERNAL_SIZE_T size;
4993 INTERNAL_SIZE_T size_flags;
4994 size_t i;
4996 /* Ensure initialization/consolidation */
4997 if (have_fastchunks(av)) malloc_consolidate(av);
4999 /* compute array length, if needed */
5000 if (chunks != 0) {
5001 if (n_elements == 0)
5002 return chunks; /* nothing to do */
5003 marray = chunks;
5004 array_size = 0;
5006 else {
5007 /* if empty req, must still return chunk representing empty array */
5008 if (n_elements == 0)
5009 return (Void_t**) _int_malloc(av, 0);
5010 marray = 0;
5011 array_size = request2size(n_elements * (sizeof(Void_t*)));
5014 /* compute total element size */
5015 if (opts & 0x1) { /* all-same-size */
5016 element_size = request2size(*sizes);
5017 contents_size = n_elements * element_size;
5019 else { /* add up all the sizes */
5020 element_size = 0;
5021 contents_size = 0;
5022 for (i = 0; i != n_elements; ++i)
5023 contents_size += request2size(sizes[i]);
5026 /* subtract out alignment bytes from total to minimize overallocation */
5027 size = contents_size + array_size - MALLOC_ALIGN_MASK;
5030 Allocate the aggregate chunk.
5031 But first disable mmap so malloc won't use it, since
5032 we would not be able to later free/realloc space internal
5033 to a segregated mmap region.
5035 mmx = mp_.n_mmaps_max; /* disable mmap */
5036 mp_.n_mmaps_max = 0;
5037 mem = _int_malloc(av, size);
5038 mp_.n_mmaps_max = mmx; /* reset mmap */
5039 if (mem == 0)
5040 return 0;
5042 p = mem2chunk(mem);
5043 assert(!chunk_is_mmapped(p));
5044 remainder_size = chunksize(p);
5046 if (opts & 0x2) { /* optionally clear the elements */
5047 MALLOC_ZERO(mem, remainder_size - SIZE_SZ - array_size);
5050 size_flags = PREV_INUSE | (av != &main_arena ? NON_MAIN_ARENA : 0);
5052 /* If not provided, allocate the pointer array as final part of chunk */
5053 if (marray == 0) {
5054 array_chunk = chunk_at_offset(p, contents_size);
5055 marray = (Void_t**) (chunk2mem(array_chunk));
5056 set_head(array_chunk, (remainder_size - contents_size) | size_flags);
5057 remainder_size = contents_size;
5060 /* split out elements */
5061 for (i = 0; ; ++i) {
5062 marray[i] = chunk2mem(p);
5063 if (i != n_elements-1) {
5064 if (element_size != 0)
5065 size = element_size;
5066 else
5067 size = request2size(sizes[i]);
5068 remainder_size -= size;
5069 set_head(p, size | size_flags);
5070 p = chunk_at_offset(p, size);
5072 else { /* the final element absorbs any overallocation slop */
5073 set_head(p, remainder_size | size_flags);
5074 break;
5078 #if MALLOC_DEBUG
5079 if (marray != chunks) {
5080 /* final element must have exactly exhausted chunk */
5081 if (element_size != 0)
5082 assert(remainder_size == element_size);
5083 else
5084 assert(remainder_size == request2size(sizes[i]));
5085 check_inuse_chunk(av, mem2chunk(marray));
5088 for (i = 0; i != n_elements; ++i)
5089 check_inuse_chunk(av, mem2chunk(marray[i]));
5090 #endif
5092 return marray;
5097 ------------------------------ valloc ------------------------------
5100 Void_t*
5101 #if __STD_C
5102 _int_valloc(mstate av, size_t bytes)
5103 #else
5104 _int_valloc(av, bytes) mstate av; size_t bytes;
5105 #endif
5107 /* Ensure initialization/consolidation */
5108 if (have_fastchunks(av)) malloc_consolidate(av);
5109 return _int_memalign(av, mp_.pagesize, bytes);
5113 ------------------------------ pvalloc ------------------------------
5117 Void_t*
5118 #if __STD_C
5119 _int_pvalloc(mstate av, size_t bytes)
5120 #else
5121 _int_pvalloc(av, bytes) mstate av, size_t bytes;
5122 #endif
5124 size_t pagesz;
5126 /* Ensure initialization/consolidation */
5127 if (have_fastchunks(av)) malloc_consolidate(av);
5128 pagesz = mp_.pagesize;
5129 return _int_memalign(av, pagesz, (bytes + pagesz - 1) & ~(pagesz - 1));
5134 ------------------------------ malloc_trim ------------------------------
5137 #if __STD_C
5138 int mTRIm(size_t pad)
5139 #else
5140 int mTRIm(pad) size_t pad;
5141 #endif
5143 mstate av = &main_arena; /* already locked */
5145 /* Ensure initialization/consolidation */
5146 malloc_consolidate(av);
5148 #ifndef MORECORE_CANNOT_TRIM
5149 return sYSTRIm(pad, av);
5150 #else
5151 return 0;
5152 #endif
5157 ------------------------- malloc_usable_size -------------------------
5160 #if __STD_C
5161 size_t mUSABLe(Void_t* mem)
5162 #else
5163 size_t mUSABLe(mem) Void_t* mem;
5164 #endif
5166 mchunkptr p;
5167 if (mem != 0) {
5168 p = mem2chunk(mem);
5169 if (chunk_is_mmapped(p))
5170 return chunksize(p) - 2*SIZE_SZ;
5171 else if (inuse(p))
5172 return chunksize(p) - SIZE_SZ;
5174 return 0;
5178 ------------------------------ mallinfo ------------------------------
5181 struct mallinfo mALLINFo(mstate av)
5183 struct mallinfo mi;
5184 size_t i;
5185 mbinptr b;
5186 mchunkptr p;
5187 INTERNAL_SIZE_T avail;
5188 INTERNAL_SIZE_T fastavail;
5189 int nblocks;
5190 int nfastblocks;
5192 /* Ensure initialization */
5193 if (av->top == 0) malloc_consolidate(av);
5195 check_malloc_state(av);
5197 /* Account for top */
5198 avail = chunksize(av->top);
5199 nblocks = 1; /* top always exists */
5201 /* traverse fastbins */
5202 nfastblocks = 0;
5203 fastavail = 0;
5205 for (i = 0; i < NFASTBINS; ++i) {
5206 for (p = av->fastbins[i]; p != 0; p = p->fd) {
5207 ++nfastblocks;
5208 fastavail += chunksize(p);
5212 avail += fastavail;
5214 /* traverse regular bins */
5215 for (i = 1; i < NBINS; ++i) {
5216 b = bin_at(av, i);
5217 for (p = last(b); p != b; p = p->bk) {
5218 ++nblocks;
5219 avail += chunksize(p);
5223 mi.smblks = nfastblocks;
5224 mi.ordblks = nblocks;
5225 mi.fordblks = avail;
5226 mi.uordblks = av->system_mem - avail;
5227 mi.arena = av->system_mem;
5228 mi.hblks = mp_.n_mmaps;
5229 mi.hblkhd = mp_.mmapped_mem;
5230 mi.fsmblks = fastavail;
5231 mi.keepcost = chunksize(av->top);
5232 mi.usmblks = mp_.max_total_mem;
5233 return mi;
5237 ------------------------------ malloc_stats ------------------------------
5240 void mSTATs()
5242 int i;
5243 mstate ar_ptr;
5244 struct mallinfo mi;
5245 unsigned int in_use_b = mp_.mmapped_mem, system_b = in_use_b;
5246 #if THREAD_STATS
5247 long stat_lock_direct = 0, stat_lock_loop = 0, stat_lock_wait = 0;
5248 #endif
5250 if(__malloc_initialized < 0)
5251 ptmalloc_init ();
5252 #ifdef _LIBC
5253 _IO_flockfile (stderr);
5254 int old_flags2 = ((_IO_FILE *) stderr)->_flags2;
5255 ((_IO_FILE *) stderr)->_flags2 |= _IO_FLAGS2_NOTCANCEL;
5256 #endif
5257 for (i=0, ar_ptr = &main_arena;; i++) {
5258 (void)mutex_lock(&ar_ptr->mutex);
5259 mi = mALLINFo(ar_ptr);
5260 fprintf(stderr, "Arena %d:\n", i);
5261 fprintf(stderr, "system bytes = %10u\n", (unsigned int)mi.arena);
5262 fprintf(stderr, "in use bytes = %10u\n", (unsigned int)mi.uordblks);
5263 #if MALLOC_DEBUG > 1
5264 if (i > 0)
5265 dump_heap(heap_for_ptr(top(ar_ptr)));
5266 #endif
5267 system_b += mi.arena;
5268 in_use_b += mi.uordblks;
5269 #if THREAD_STATS
5270 stat_lock_direct += ar_ptr->stat_lock_direct;
5271 stat_lock_loop += ar_ptr->stat_lock_loop;
5272 stat_lock_wait += ar_ptr->stat_lock_wait;
5273 #endif
5274 (void)mutex_unlock(&ar_ptr->mutex);
5275 ar_ptr = ar_ptr->next;
5276 if(ar_ptr == &main_arena) break;
5278 #if HAVE_MMAP
5279 fprintf(stderr, "Total (incl. mmap):\n");
5280 #else
5281 fprintf(stderr, "Total:\n");
5282 #endif
5283 fprintf(stderr, "system bytes = %10u\n", system_b);
5284 fprintf(stderr, "in use bytes = %10u\n", in_use_b);
5285 #ifdef NO_THREADS
5286 fprintf(stderr, "max system bytes = %10u\n", (unsigned int)mp_.max_total_mem);
5287 #endif
5288 #if HAVE_MMAP
5289 fprintf(stderr, "max mmap regions = %10u\n", (unsigned int)mp_.max_n_mmaps);
5290 fprintf(stderr, "max mmap bytes = %10lu\n",
5291 (unsigned long)mp_.max_mmapped_mem);
5292 #endif
5293 #if THREAD_STATS
5294 fprintf(stderr, "heaps created = %10d\n", stat_n_heaps);
5295 fprintf(stderr, "locked directly = %10ld\n", stat_lock_direct);
5296 fprintf(stderr, "locked in loop = %10ld\n", stat_lock_loop);
5297 fprintf(stderr, "locked waiting = %10ld\n", stat_lock_wait);
5298 fprintf(stderr, "locked total = %10ld\n",
5299 stat_lock_direct + stat_lock_loop + stat_lock_wait);
5300 #endif
5301 #ifdef _LIBC
5302 ((_IO_FILE *) stderr)->_flags2 |= old_flags2;
5303 _IO_funlockfile (stderr);
5304 #endif
5309 ------------------------------ mallopt ------------------------------
5312 #if __STD_C
5313 int mALLOPt(int param_number, int value)
5314 #else
5315 int mALLOPt(param_number, value) int param_number; int value;
5316 #endif
5318 mstate av = &main_arena;
5319 int res = 1;
5321 if(__malloc_initialized < 0)
5322 ptmalloc_init ();
5323 (void)mutex_lock(&av->mutex);
5324 /* Ensure initialization/consolidation */
5325 malloc_consolidate(av);
5327 switch(param_number) {
5328 case M_MXFAST:
5329 if (value >= 0 && value <= MAX_FAST_SIZE) {
5330 set_max_fast(av, value);
5332 else
5333 res = 0;
5334 break;
5336 case M_TRIM_THRESHOLD:
5337 mp_.trim_threshold = value;
5338 break;
5340 case M_TOP_PAD:
5341 mp_.top_pad = value;
5342 break;
5344 case M_MMAP_THRESHOLD:
5345 #if USE_ARENAS
5346 /* Forbid setting the threshold too high. */
5347 if((unsigned long)value > HEAP_MAX_SIZE/2)
5348 res = 0;
5349 else
5350 #endif
5351 mp_.mmap_threshold = value;
5352 break;
5354 case M_MMAP_MAX:
5355 #if !HAVE_MMAP
5356 if (value != 0)
5357 res = 0;
5358 else
5359 #endif
5360 mp_.n_mmaps_max = value;
5361 break;
5363 case M_CHECK_ACTION:
5364 check_action = value;
5365 break;
5367 (void)mutex_unlock(&av->mutex);
5368 return res;
5373 -------------------- Alternative MORECORE functions --------------------
5378 General Requirements for MORECORE.
5380 The MORECORE function must have the following properties:
5382 If MORECORE_CONTIGUOUS is false:
5384 * MORECORE must allocate in multiples of pagesize. It will
5385 only be called with arguments that are multiples of pagesize.
5387 * MORECORE(0) must return an address that is at least
5388 MALLOC_ALIGNMENT aligned. (Page-aligning always suffices.)
5390 else (i.e. If MORECORE_CONTIGUOUS is true):
5392 * Consecutive calls to MORECORE with positive arguments
5393 return increasing addresses, indicating that space has been
5394 contiguously extended.
5396 * MORECORE need not allocate in multiples of pagesize.
5397 Calls to MORECORE need not have args of multiples of pagesize.
5399 * MORECORE need not page-align.
5401 In either case:
5403 * MORECORE may allocate more memory than requested. (Or even less,
5404 but this will generally result in a malloc failure.)
5406 * MORECORE must not allocate memory when given argument zero, but
5407 instead return one past the end address of memory from previous
5408 nonzero call. This malloc does NOT call MORECORE(0)
5409 until at least one call with positive arguments is made, so
5410 the initial value returned is not important.
5412 * Even though consecutive calls to MORECORE need not return contiguous
5413 addresses, it must be OK for malloc'ed chunks to span multiple
5414 regions in those cases where they do happen to be contiguous.
5416 * MORECORE need not handle negative arguments -- it may instead
5417 just return MORECORE_FAILURE when given negative arguments.
5418 Negative arguments are always multiples of pagesize. MORECORE
5419 must not misinterpret negative args as large positive unsigned
5420 args. You can suppress all such calls from even occurring by defining
5421 MORECORE_CANNOT_TRIM,
5423 There is some variation across systems about the type of the
5424 argument to sbrk/MORECORE. If size_t is unsigned, then it cannot
5425 actually be size_t, because sbrk supports negative args, so it is
5426 normally the signed type of the same width as size_t (sometimes
5427 declared as "intptr_t", and sometimes "ptrdiff_t"). It doesn't much
5428 matter though. Internally, we use "long" as arguments, which should
5429 work across all reasonable possibilities.
5431 Additionally, if MORECORE ever returns failure for a positive
5432 request, and HAVE_MMAP is true, then mmap is used as a noncontiguous
5433 system allocator. This is a useful backup strategy for systems with
5434 holes in address spaces -- in this case sbrk cannot contiguously
5435 expand the heap, but mmap may be able to map noncontiguous space.
5437 If you'd like mmap to ALWAYS be used, you can define MORECORE to be
5438 a function that always returns MORECORE_FAILURE.
5440 If you are using this malloc with something other than sbrk (or its
5441 emulation) to supply memory regions, you probably want to set
5442 MORECORE_CONTIGUOUS as false. As an example, here is a custom
5443 allocator kindly contributed for pre-OSX macOS. It uses virtually
5444 but not necessarily physically contiguous non-paged memory (locked
5445 in, present and won't get swapped out). You can use it by
5446 uncommenting this section, adding some #includes, and setting up the
5447 appropriate defines above:
5449 #define MORECORE osMoreCore
5450 #define MORECORE_CONTIGUOUS 0
5452 There is also a shutdown routine that should somehow be called for
5453 cleanup upon program exit.
5455 #define MAX_POOL_ENTRIES 100
5456 #define MINIMUM_MORECORE_SIZE (64 * 1024)
5457 static int next_os_pool;
5458 void *our_os_pools[MAX_POOL_ENTRIES];
5460 void *osMoreCore(int size)
5462 void *ptr = 0;
5463 static void *sbrk_top = 0;
5465 if (size > 0)
5467 if (size < MINIMUM_MORECORE_SIZE)
5468 size = MINIMUM_MORECORE_SIZE;
5469 if (CurrentExecutionLevel() == kTaskLevel)
5470 ptr = PoolAllocateResident(size + RM_PAGE_SIZE, 0);
5471 if (ptr == 0)
5473 return (void *) MORECORE_FAILURE;
5475 // save ptrs so they can be freed during cleanup
5476 our_os_pools[next_os_pool] = ptr;
5477 next_os_pool++;
5478 ptr = (void *) ((((unsigned long) ptr) + RM_PAGE_MASK) & ~RM_PAGE_MASK);
5479 sbrk_top = (char *) ptr + size;
5480 return ptr;
5482 else if (size < 0)
5484 // we don't currently support shrink behavior
5485 return (void *) MORECORE_FAILURE;
5487 else
5489 return sbrk_top;
5493 // cleanup any allocated memory pools
5494 // called as last thing before shutting down driver
5496 void osCleanupMem(void)
5498 void **ptr;
5500 for (ptr = our_os_pools; ptr < &our_os_pools[MAX_POOL_ENTRIES]; ptr++)
5501 if (*ptr)
5503 PoolDeallocate(*ptr);
5504 *ptr = 0;
5511 /* Helper code. */
5513 static void
5514 malloc_printerr(int action, const char *str, void *ptr)
5516 if (action & 1)
5518 char buf[2 * sizeof (uintptr_t) + 1];
5520 buf[sizeof (buf) - 1] = '\0';
5521 char *cp = _itoa_word ((uintptr_t) ptr, &buf[sizeof (buf) - 1], 16, 0);
5522 while (cp > buf)
5523 *--cp = '0';
5525 __libc_message (action & 2,
5526 action & 4
5527 ? "%s\n" : "*** glibc detected *** %s: 0x%s ***\n",
5528 str, cp);
5530 else if (action & 2)
5531 abort ();
5534 #ifdef _LIBC
5535 # include <sys/param.h>
5537 /* We need a wrapper function for one of the additions of POSIX. */
5539 __posix_memalign (void **memptr, size_t alignment, size_t size)
5541 void *mem;
5542 __malloc_ptr_t (*hook) __MALLOC_PMT ((size_t, size_t,
5543 __const __malloc_ptr_t)) =
5544 __memalign_hook;
5546 /* Test whether the SIZE argument is valid. It must be a power of
5547 two multiple of sizeof (void *). */
5548 if (alignment % sizeof (void *) != 0
5549 || !powerof2 (alignment / sizeof (void *)) != 0
5550 || alignment == 0)
5551 return EINVAL;
5553 /* Call the hook here, so that caller is posix_memalign's caller
5554 and not posix_memalign itself. */
5555 if (hook != NULL)
5556 mem = (*hook)(alignment, size, RETURN_ADDRESS (0));
5557 else
5558 mem = public_mEMALIGn (alignment, size);
5560 if (mem != NULL) {
5561 *memptr = mem;
5562 return 0;
5565 return ENOMEM;
5567 weak_alias (__posix_memalign, posix_memalign)
5569 strong_alias (__libc_calloc, __calloc) weak_alias (__libc_calloc, calloc)
5570 strong_alias (__libc_free, __cfree) weak_alias (__libc_free, cfree)
5571 strong_alias (__libc_free, __free) strong_alias (__libc_free, free)
5572 strong_alias (__libc_malloc, __malloc) strong_alias (__libc_malloc, malloc)
5573 strong_alias (__libc_memalign, __memalign)
5574 weak_alias (__libc_memalign, memalign)
5575 strong_alias (__libc_realloc, __realloc) strong_alias (__libc_realloc, realloc)
5576 strong_alias (__libc_valloc, __valloc) weak_alias (__libc_valloc, valloc)
5577 strong_alias (__libc_pvalloc, __pvalloc) weak_alias (__libc_pvalloc, pvalloc)
5578 strong_alias (__libc_mallinfo, __mallinfo)
5579 weak_alias (__libc_mallinfo, mallinfo)
5580 strong_alias (__libc_mallopt, __mallopt) weak_alias (__libc_mallopt, mallopt)
5582 weak_alias (__malloc_stats, malloc_stats)
5583 weak_alias (__malloc_usable_size, malloc_usable_size)
5584 weak_alias (__malloc_trim, malloc_trim)
5585 weak_alias (__malloc_get_state, malloc_get_state)
5586 weak_alias (__malloc_set_state, malloc_set_state)
5588 #endif /* _LIBC */
5590 /* ------------------------------------------------------------
5591 History:
5593 [see ftp://g.oswego.edu/pub/misc/malloc.c for the history of dlmalloc]
5597 * Local variables:
5598 * c-basic-offset: 2
5599 * End: