      1 /******************************************************************************/
      2 #ifdef JEMALLOC_H_TYPES
      3 
      4 #define	LARGE_MINCLASS		(ZU(1) << LG_LARGE_MINCLASS)
      5 
      6 /* Maximum number of regions in one run. */
      7 #define	LG_RUN_MAXREGS		(LG_PAGE - LG_TINY_MIN)
      8 #define	RUN_MAXREGS		(1U << LG_RUN_MAXREGS)
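/*
 * Illustrative example (values depend on the build configuration): with
 * LG_PAGE == 12 and LG_TINY_MIN == 3, LG_RUN_MAXREGS == 9, so a single run
 * can hold at most RUN_MAXREGS == 512 regions.
 */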
      9 
     10 /*
     11  * Minimum redzone size.  Redzones may be larger than this if necessary to
     12  * preserve region alignment.
     13  */
     14 #define	REDZONE_MINSIZE		16
     15 
     16 /*
     17  * The minimum ratio of active:dirty pages per arena is computed as:
     18  *
     19  *   (nactive >> lg_dirty_mult) >= ndirty
     20  *
 * So, supposing that lg_dirty_mult is 3, there must be at least 8 times as
 * many active pages as dirty pages.
     23  */
     24 #define	LG_DIRTY_MULT_DEFAULT	3
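/*
 * Worked example (illustrative): with lg_dirty_mult == 3 and nactive == 1024,
 * (1024 >> 3) == 128, so purging keeps ndirty at or below 128 pages.
 */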
     25 
     26 typedef enum {
     27 	purge_mode_ratio = 0,
     28 	purge_mode_decay = 1,
     29 
     30 	purge_mode_limit = 2
     31 } purge_mode_t;
     32 /* ANDROID change */
/* Use the decay purge mode.  Setting DECAY_TIME_DEFAULT to zero forces all
 * pages to be purged as soon as they are no longer in use.
     35  */
     36 #define	PURGE_DEFAULT		purge_mode_decay
     37 /* Default decay time in seconds. */
     38 #define	DECAY_TIME_DEFAULT	0
     39 /* End ANDROID change */
     40 /* Number of event ticks between time checks. */
     41 #define	DECAY_NTICKS_PER_UPDATE	1000
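/*
 * For example, with DECAY_NTICKS_PER_UPDATE == 1000, arena_decay_ticks()
 * (defined below) reads the clock and considers purging roughly once per
 * 1000 ticks.
 */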
     42 
     43 typedef struct arena_runs_dirty_link_s arena_runs_dirty_link_t;
     44 typedef struct arena_run_s arena_run_t;
     45 typedef struct arena_chunk_map_bits_s arena_chunk_map_bits_t;
     46 typedef struct arena_chunk_map_misc_s arena_chunk_map_misc_t;
     47 typedef struct arena_chunk_s arena_chunk_t;
     48 typedef struct arena_bin_info_s arena_bin_info_t;
     49 typedef struct arena_bin_s arena_bin_t;
     50 typedef struct arena_s arena_t;
     51 typedef struct arena_tdata_s arena_tdata_t;
     52 
     53 #endif /* JEMALLOC_H_TYPES */
     54 /******************************************************************************/
     55 #ifdef JEMALLOC_H_STRUCTS
     56 
     57 #ifdef JEMALLOC_ARENA_STRUCTS_A
     58 struct arena_run_s {
     59 	/* Index of bin this run is associated with. */
     60 	szind_t		binind;
     61 
     62 	/* Number of free regions in run. */
     63 	unsigned	nfree;
     64 
     65 	/* Per region allocated/deallocated bitmap. */
     66 	bitmap_t	bitmap[BITMAP_GROUPS_MAX];
     67 };
     68 
     69 /* Each element of the chunk map corresponds to one page within the chunk. */
     70 struct arena_chunk_map_bits_s {
     71 	/*
     72 	 * Run address (or size) and various flags are stored together.  The bit
     73 	 * layout looks like (assuming 32-bit system):
     74 	 *
     75 	 *   ???????? ???????? ???nnnnn nnndumla
     76 	 *
     77 	 * ? : Unallocated: Run address for first/last pages, unset for internal
     78 	 *                  pages.
     79 	 *     Small: Run page offset.
     80 	 *     Large: Run page count for first page, unset for trailing pages.
     81 	 * n : binind for small size class, BININD_INVALID for large size class.
     82 	 * d : dirty?
     83 	 * u : unzeroed?
     84 	 * m : decommitted?
     85 	 * l : large?
     86 	 * a : allocated?
     87 	 *
     88 	 * Following are example bit patterns for the three types of runs.
     89 	 *
     90 	 * p : run page offset
     91 	 * s : run size
     92 	 * n : binind for size class; large objects set these to BININD_INVALID
     93 	 * x : don't care
     94 	 * - : 0
     95 	 * + : 1
     96 	 * [DUMLA] : bit set
     97 	 * [dumla] : bit unset
     98 	 *
     99 	 *   Unallocated (clean):
    100 	 *     ssssssss ssssssss sss+++++ +++dum-a
    101 	 *     xxxxxxxx xxxxxxxx xxxxxxxx xxx-Uxxx
    102 	 *     ssssssss ssssssss sss+++++ +++dUm-a
    103 	 *
    104 	 *   Unallocated (dirty):
    105 	 *     ssssssss ssssssss sss+++++ +++D-m-a
    106 	 *     xxxxxxxx xxxxxxxx xxxxxxxx xxxxxxxx
    107 	 *     ssssssss ssssssss sss+++++ +++D-m-a
    108 	 *
    109 	 *   Small:
    110 	 *     pppppppp pppppppp pppnnnnn nnnd---A
    111 	 *     pppppppp pppppppp pppnnnnn nnn----A
    112 	 *     pppppppp pppppppp pppnnnnn nnnd---A
    113 	 *
    114 	 *   Large:
    115 	 *     ssssssss ssssssss sss+++++ +++D--LA
    116 	 *     xxxxxxxx xxxxxxxx xxxxxxxx xxxxxxxx
    117 	 *     -------- -------- ---+++++ +++D--LA
    118 	 *
    119 	 *   Large (sampled, size <= LARGE_MINCLASS):
    120 	 *     ssssssss ssssssss sssnnnnn nnnD--LA
    121 	 *     xxxxxxxx xxxxxxxx xxxxxxxx xxxxxxxx
    122 	 *     -------- -------- ---+++++ +++D--LA
    123 	 *
    124 	 *   Large (not sampled, size == LARGE_MINCLASS):
    125 	 *     ssssssss ssssssss sss+++++ +++D--LA
    126 	 *     xxxxxxxx xxxxxxxx xxxxxxxx xxxxxxxx
    127 	 *     -------- -------- ---+++++ +++D--LA
    128 	 */
    129 	size_t				bits;
    130 #define	CHUNK_MAP_ALLOCATED	((size_t)0x01U)
    131 #define	CHUNK_MAP_LARGE		((size_t)0x02U)
    132 #define	CHUNK_MAP_STATE_MASK	((size_t)0x3U)
    133 
    134 #define	CHUNK_MAP_DECOMMITTED	((size_t)0x04U)
    135 #define	CHUNK_MAP_UNZEROED	((size_t)0x08U)
    136 #define	CHUNK_MAP_DIRTY		((size_t)0x10U)
    137 #define	CHUNK_MAP_FLAGS_MASK	((size_t)0x1cU)
    138 
    139 #define	CHUNK_MAP_BININD_SHIFT	5
    140 #define	BININD_INVALID		((size_t)0xffU)
    141 #define	CHUNK_MAP_BININD_MASK	(BININD_INVALID << CHUNK_MAP_BININD_SHIFT)
    142 #define	CHUNK_MAP_BININD_INVALID CHUNK_MAP_BININD_MASK
    143 
    144 #define	CHUNK_MAP_RUNIND_SHIFT	(CHUNK_MAP_BININD_SHIFT + 8)
    145 #define	CHUNK_MAP_SIZE_SHIFT	(CHUNK_MAP_RUNIND_SHIFT - LG_PAGE)
    146 #define	CHUNK_MAP_SIZE_MASK						\
    147     (~(CHUNK_MAP_BININD_MASK | CHUNK_MAP_FLAGS_MASK | CHUNK_MAP_STATE_MASK))
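	/*
	 * Illustrative example: the bits word for the third page (run page
	 * offset 2) of a small run using bin 3, with no flags set, would be
	 *
	 *   (2 << CHUNK_MAP_RUNIND_SHIFT) | (3 << CHUNK_MAP_BININD_SHIFT) |
	 *       CHUNK_MAP_ALLOCATED == 0x4061
	 *
	 * i.e. run page offset 2, binind 3, and only the A flag set.
	 */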
    148 };
    149 
    150 struct arena_runs_dirty_link_s {
    151 	qr(arena_runs_dirty_link_t)	rd_link;
    152 };
    153 
    154 /*
    155  * Each arena_chunk_map_misc_t corresponds to one page within the chunk, just
    156  * like arena_chunk_map_bits_t.  Two separate arrays are stored within each
    157  * chunk header in order to improve cache locality.
    158  */
    159 struct arena_chunk_map_misc_s {
    160 	/*
    161 	 * Linkage for run trees.  There are two disjoint uses:
    162 	 *
    163 	 * 1) arena_t's runs_avail tree.
    164 	 * 2) arena_run_t conceptually uses this linkage for in-use non-full
    165 	 *    runs, rather than directly embedding linkage.
    166 	 */
    167 	rb_node(arena_chunk_map_misc_t)		rb_link;
    168 
    169 	union {
    170 		/* Linkage for list of dirty runs. */
    171 		arena_runs_dirty_link_t		rd;
    172 
    173 		/* Profile counters, used for large object runs. */
    174 		union {
    175 			void			*prof_tctx_pun;
    176 			prof_tctx_t		*prof_tctx;
    177 		};
    178 
    179 		/* Small region run metadata. */
    180 		arena_run_t			run;
    181 	};
    182 };
    183 typedef rb_tree(arena_chunk_map_misc_t) arena_run_tree_t;
    184 #endif /* JEMALLOC_ARENA_STRUCTS_A */
    185 
    186 #ifdef JEMALLOC_ARENA_STRUCTS_B
    187 /* Arena chunk header. */
    188 struct arena_chunk_s {
    189 	/*
    190 	 * A pointer to the arena that owns the chunk is stored within the node.
    191 	 * This field as a whole is used by chunks_rtree to support both
    192 	 * ivsalloc() and core-based debugging.
    193 	 */
    194 	extent_node_t		node;
    195 
    196 	/*
    197 	 * Map of pages within chunk that keeps track of free/large/small.  The
    198 	 * first map_bias entries are omitted, since the chunk header does not
    199 	 * need to be tracked in the map.  This omission saves a header page
    200 	 * for common chunk sizes (e.g. 4 MiB).
    201 	 */
    202 	arena_chunk_map_bits_t	map_bits[1]; /* Dynamically sized. */
    203 };
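/*
 * Illustrative sizing (assuming 2 MiB chunks and 4 KiB pages): a chunk spans
 * 512 pages, and map_bits[] holds (chunk_npages - map_bias) entries because
 * the pages occupied by the header itself are not tracked.
 */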
    204 
    205 /*
    206  * Read-only information associated with each element of arena_t's bins array
    207  * is stored separately, partly to reduce memory usage (only one copy, rather
    208  * than one per arena), but mainly to avoid false cacheline sharing.
    209  *
    210  * Each run has the following layout:
    211  *
    212  *               /--------------------\
    213  *               | pad?               |
    214  *               |--------------------|
    215  *               | redzone            |
    216  *   reg0_offset | region 0           |
    217  *               | redzone            |
    218  *               |--------------------| \
    219  *               | redzone            | |
    220  *               | region 1           |  > reg_interval
    221  *               | redzone            | /
    222  *               |--------------------|
    223  *               | ...                |
    224  *               | ...                |
    225  *               | ...                |
    226  *               |--------------------|
    227  *               | redzone            |
    228  *               | region nregs-1     |
    229  *               | redzone            |
    230  *               |--------------------|
    231  *               | alignment pad?     |
    232  *               \--------------------/
    233  *
    234  * reg_interval has at least the same minimum alignment as reg_size; this
    235  * preserves the alignment constraint that sa2u() depends on.  Alignment pad is
    236  * either 0 or redzone_size; it is present only if needed to align reg0_offset.
    237  */
    238 struct arena_bin_info_s {
    239 	/* Size of regions in a run for this bin's size class. */
    240 	size_t			reg_size;
    241 
    242 	/* Redzone size. */
    243 	size_t			redzone_size;
    244 
    245 	/* Interval between regions (reg_size + (redzone_size << 1)). */
    246 	size_t			reg_interval;
    247 
    248 	/* Total size of a run for this bin's size class. */
    249 	size_t			run_size;
    250 
    251 	/* Total number of regions in a run for this bin's size class. */
    252 	uint32_t		nregs;
    253 
    254 	/*
    255 	 * Metadata used to manipulate bitmaps for runs associated with this
    256 	 * bin.
    257 	 */
    258 	bitmap_info_t		bitmap_info;
    259 
    260 	/* Offset of first region in a run for this bin's size class. */
    261 	uint32_t		reg0_offset;
    262 };
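/*
 * Illustrative example (hypothetical bin, assuming redzones are in use with
 * redzone_size == REDZONE_MINSIZE): for reg_size == 32, reg_interval ==
 * 32 + (16 << 1) == 64, so region i starts reg0_offset + i * 64 bytes into
 * the run.
 */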
    263 
    264 struct arena_bin_s {
    265 	/*
    266 	 * All operations on runcur, runs, and stats require that lock be
    267 	 * locked.  Run allocation/deallocation are protected by the arena lock,
    268 	 * which may be acquired while holding one or more bin locks, but not
    269 	 * vise versa.
	 * vice versa.
    271 	malloc_mutex_t		lock;
    272 
    273 	/*
    274 	 * Current run being used to service allocations of this bin's size
    275 	 * class.
    276 	 */
    277 	arena_run_t		*runcur;
    278 
    279 	/*
    280 	 * Tree of non-full runs.  This tree is used when looking for an
    281 	 * existing run when runcur is no longer usable.  We choose the
    282 	 * non-full run that is lowest in memory; this policy tends to keep
    283 	 * objects packed well, and it can also help reduce the number of
    284 	 * almost-empty chunks.
    285 	 */
    286 	arena_run_tree_t	runs;
    287 
    288 	/* Bin statistics. */
    289 	malloc_bin_stats_t	stats;
    290 };
    291 
    292 struct arena_s {
    293 	/* This arena's index within the arenas array. */
    294 	unsigned		ind;
    295 
    296 	/*
    297 	 * Number of threads currently assigned to this arena.  This field is
    298 	 * synchronized via atomic operations.
    299 	 */
    300 	unsigned		nthreads;
    301 
    302 	/*
    303 	 * There are three classes of arena operations from a locking
    304 	 * perspective:
    305 	 * 1) Thread assignment (modifies nthreads) is synchronized via atomics.
    306 	 * 2) Bin-related operations are protected by bin locks.
    307 	 * 3) Chunk- and run-related operations are protected by this mutex.
    308 	 */
    309 	malloc_mutex_t		lock;
    310 
    311 	arena_stats_t		stats;
    312 	/*
    313 	 * List of tcaches for extant threads associated with this arena.
    314 	 * Stats from these are merged incrementally, and at exit if
    315 	 * opt_stats_print is enabled.
    316 	 */
    317 	ql_head(tcache_t)	tcache_ql;
    318 
    319 	uint64_t		prof_accumbytes;
    320 
    321 	/*
    322 	 * PRNG state for cache index randomization of large allocation base
    323 	 * pointers.
    324 	 */
    325 	uint64_t		offset_state;
    326 
    327 	dss_prec_t		dss_prec;
    328 
    329 	/*
    330 	 * In order to avoid rapid chunk allocation/deallocation when an arena
    331 	 * oscillates right on the cusp of needing a new chunk, cache the most
    332 	 * recently freed chunk.  The spare is left in the arena's chunk trees
    333 	 * until it is deleted.
    334 	 *
    335 	 * There is one spare chunk per arena, rather than one spare total, in
    336 	 * order to avoid interactions between multiple threads that could make
    337 	 * a single spare inadequate.
    338 	 */
    339 	arena_chunk_t		*spare;
    340 
    341 	/* Minimum ratio (log base 2) of nactive:ndirty. */
    342 	ssize_t			lg_dirty_mult;
    343 
    344 	/* True if a thread is currently executing arena_purge_to_limit(). */
    345 	bool			purging;
    346 
    347 	/* Number of pages in active runs and huge regions. */
    348 	size_t			nactive;
    349 
    350 	/*
    351 	 * Current count of pages within unused runs that are potentially
    352 	 * dirty, and for which madvise(... MADV_DONTNEED) has not been called.
    353 	 * By tracking this, we can institute a limit on how much dirty unused
    354 	 * memory is mapped for each arena.
    355 	 */
    356 	size_t			ndirty;
    357 
    358 	/*
    359 	 * Unused dirty memory this arena manages.  Dirty memory is conceptually
    360 	 * tracked as an arbitrarily interleaved LRU of dirty runs and cached
    361 	 * chunks, but the list linkage is actually semi-duplicated in order to
    362 	 * avoid extra arena_chunk_map_misc_t space overhead.
    363 	 *
    364 	 *   LRU-----------------------------------------------------------MRU
    365 	 *
    366 	 *        /-- arena ---\
    367 	 *        |            |
    368 	 *        |            |
    369 	 *        |------------|                             /- chunk -\
    370 	 *   ...->|chunks_cache|<--------------------------->|  /----\ |<--...
    371 	 *        |------------|                             |  |node| |
    372 	 *        |            |                             |  |    | |
    373 	 *        |            |    /- run -\    /- run -\   |  |    | |
    374 	 *        |            |    |       |    |       |   |  |    | |
    375 	 *        |            |    |       |    |       |   |  |    | |
    376 	 *        |------------|    |-------|    |-------|   |  |----| |
    377 	 *   ...->|runs_dirty  |<-->|rd     |<-->|rd     |<---->|rd  |<----...
    378 	 *        |------------|    |-------|    |-------|   |  |----| |
    379 	 *        |            |    |       |    |       |   |  |    | |
    380 	 *        |            |    |       |    |       |   |  \----/ |
    381 	 *        |            |    \-------/    \-------/   |         |
    382 	 *        |            |                             |         |
    383 	 *        |            |                             |         |
    384 	 *        \------------/                             \---------/
    385 	 */
    386 	arena_runs_dirty_link_t	runs_dirty;
    387 	extent_node_t		chunks_cache;
    388 
    389 	/*
    390 	 * Approximate time in seconds from the creation of a set of unused
    391 	 * dirty pages until an equivalent set of unused dirty pages is purged
    392 	 * and/or reused.
    393 	 */
    394 	ssize_t			decay_time;
    395 	/* decay_time / SMOOTHSTEP_NSTEPS. */
    396 	nstime_t		decay_interval;
    397 	/*
    398 	 * Time at which the current decay interval logically started.  We do
    399 	 * not actually advance to a new epoch until sometime after it starts
    400 	 * because of scheduling and computation delays, and it is even possible
    401 	 * to completely skip epochs.  In all cases, during epoch advancement we
    402 	 * merge all relevant activity into the most recently recorded epoch.
    403 	 */
    404 	nstime_t		decay_epoch;
    405 	/* decay_deadline randomness generator. */
    406 	uint64_t		decay_jitter_state;
    407 	/*
    408 	 * Deadline for current epoch.  This is the sum of decay_interval and
    409 	 * per epoch jitter which is a uniform random variable in
    410 	 * [0..decay_interval).  Epochs always advance by precise multiples of
    411 	 * decay_interval, but we randomize the deadline to reduce the
    412 	 * likelihood of arenas purging in lockstep.
    413 	 */
    414 	nstime_t		decay_deadline;
    415 	/*
    416 	 * Number of dirty pages at beginning of current epoch.  During epoch
    417 	 * advancement we use the delta between decay_ndirty and ndirty to
    418 	 * determine how many dirty pages, if any, were generated, and record
    419 	 * the result in decay_backlog.
    420 	 */
    421 	size_t			decay_ndirty;
    422 	/*
    423 	 * Memoized result of arena_decay_backlog_npages_limit() corresponding
    424 	 * to the current contents of decay_backlog, i.e. the limit on how many
    425 	 * pages are allowed to exist for the decay epochs.
    426 	 */
    427 	size_t			decay_backlog_npages_limit;
    428 	/*
    429 	 * Trailing log of how many unused dirty pages were generated during
    430 	 * each of the past SMOOTHSTEP_NSTEPS decay epochs, where the last
    431 	 * element is the most recent epoch.  Corresponding epoch times are
    432 	 * relative to decay_epoch.
    433 	 */
    434 	size_t			decay_backlog[SMOOTHSTEP_NSTEPS];
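	/*
	 * Illustrative example (assuming SMOOTHSTEP_NSTEPS == 200): with
	 * decay_time == 10 seconds, decay_interval is 50 ms; roughly every
	 * 50 ms the epoch logically advances, the oldest decay_backlog element
	 * is dropped, and the count of dirty pages generated since the
	 * previous epoch is appended.
	 */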
    435 
    436 	/* Extant huge allocations. */
    437 	ql_head(extent_node_t)	huge;
    438 	/* Synchronizes all huge allocation/update/deallocation. */
    439 	malloc_mutex_t		huge_mtx;
    440 
    441 	/*
    442 	 * Trees of chunks that were previously allocated (trees differ only in
    443 	 * node ordering).  These are used when allocating chunks, in an attempt
    444 	 * to re-use address space.  Depending on function, different tree
    445 	 * orderings are needed, which is why there are two trees with the same
    446 	 * contents.
    447 	 */
    448 	extent_tree_t		chunks_szad_cached;
    449 	extent_tree_t		chunks_ad_cached;
    450 	extent_tree_t		chunks_szad_retained;
    451 	extent_tree_t		chunks_ad_retained;
    452 
    453 	malloc_mutex_t		chunks_mtx;
    454 	/* Cache of nodes that were allocated via base_alloc(). */
    455 	ql_head(extent_node_t)	node_cache;
    456 	malloc_mutex_t		node_cache_mtx;
    457 
    458 	/* User-configurable chunk hook functions. */
    459 	chunk_hooks_t		chunk_hooks;
    460 
    461 	/* bins is used to store trees of free regions. */
    462 	arena_bin_t		bins[NBINS];
    463 
    464 	/*
    465 	 * Quantized address-ordered trees of this arena's available runs.  The
    466 	 * trees are used for first-best-fit run allocation.
    467 	 */
    468 	arena_run_tree_t	runs_avail[1]; /* Dynamically sized. */
    469 };
    470 
    471 /* Used in conjunction with tsd for fast arena-related context lookup. */
    472 struct arena_tdata_s {
    473 	ticker_t		decay_ticker;
    474 };
    475 #endif /* JEMALLOC_ARENA_STRUCTS_B */
    476 
    477 #endif /* JEMALLOC_H_STRUCTS */
    478 /******************************************************************************/
    479 #ifdef JEMALLOC_H_EXTERNS
    480 
    481 static const size_t	large_pad =
    482 #ifdef JEMALLOC_CACHE_OBLIVIOUS
    483     PAGE
    484 #else
    485     0
    486 #endif
    487     ;
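/*
 * Illustrative consequence (assuming 4 KiB pages): when cache-oblivious large
 * allocation is enabled, a 16 KiB large allocation occupies a 5 page run;
 * arena_salloc() subtracts large_pad so that the reported size is still
 * 16384 bytes.
 */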
    488 
    489 extern purge_mode_t	opt_purge;
    490 extern const char	*purge_mode_names[];
    491 extern ssize_t		opt_lg_dirty_mult;
    492 extern ssize_t		opt_decay_time;
    493 
    494 extern arena_bin_info_t	arena_bin_info[NBINS];
    495 
    496 extern size_t		map_bias; /* Number of arena chunk header pages. */
    497 extern size_t		map_misc_offset;
    498 extern size_t		arena_maxrun; /* Max run size for arenas. */
    499 extern size_t		large_maxclass; /* Max large size class. */
    500 extern size_t		run_quantize_max; /* Max run_quantize_*() input. */
    501 extern unsigned		nlclasses; /* Number of large size classes. */
    502 extern unsigned		nhclasses; /* Number of huge size classes. */
    503 
    504 #ifdef JEMALLOC_JET
    505 typedef size_t (run_quantize_t)(size_t);
    506 extern run_quantize_t *run_quantize_floor;
    507 extern run_quantize_t *run_quantize_ceil;
    508 #endif
    509 void	arena_chunk_cache_maybe_insert(arena_t *arena, extent_node_t *node,
    510     bool cache);
    511 void	arena_chunk_cache_maybe_remove(arena_t *arena, extent_node_t *node,
    512     bool cache);
    513 extent_node_t	*arena_node_alloc(arena_t *arena);
    514 void	arena_node_dalloc(arena_t *arena, extent_node_t *node);
    515 void	*arena_chunk_alloc_huge(arena_t *arena, size_t usize, size_t alignment,
    516     bool *zero);
    517 void	arena_chunk_dalloc_huge(arena_t *arena, void *chunk, size_t usize);
    518 void	arena_chunk_ralloc_huge_similar(arena_t *arena, void *chunk,
    519     size_t oldsize, size_t usize);
    520 void	arena_chunk_ralloc_huge_shrink(arena_t *arena, void *chunk,
    521     size_t oldsize, size_t usize);
    522 bool	arena_chunk_ralloc_huge_expand(arena_t *arena, void *chunk,
    523     size_t oldsize, size_t usize, bool *zero);
    524 ssize_t	arena_lg_dirty_mult_get(arena_t *arena);
    525 bool	arena_lg_dirty_mult_set(arena_t *arena, ssize_t lg_dirty_mult);
    526 ssize_t	arena_decay_time_get(arena_t *arena);
    527 bool	arena_decay_time_set(arena_t *arena, ssize_t decay_time);
    528 void	arena_maybe_purge(arena_t *arena);
    529 void	arena_purge(arena_t *arena, bool all);
    530 void	arena_tcache_fill_small(tsd_t *tsd, arena_t *arena, tcache_bin_t *tbin,
    531     szind_t binind, uint64_t prof_accumbytes);
    532 void	arena_alloc_junk_small(void *ptr, arena_bin_info_t *bin_info,
    533     bool zero);
    534 #ifdef JEMALLOC_JET
    535 typedef void (arena_redzone_corruption_t)(void *, size_t, bool, size_t,
    536     uint8_t);
    537 extern arena_redzone_corruption_t *arena_redzone_corruption;
    538 typedef void (arena_dalloc_junk_small_t)(void *, arena_bin_info_t *);
    539 extern arena_dalloc_junk_small_t *arena_dalloc_junk_small;
    540 #else
    541 void	arena_dalloc_junk_small(void *ptr, arena_bin_info_t *bin_info);
    542 #endif
    543 void	arena_quarantine_junk_small(void *ptr, size_t usize);
    544 void	*arena_malloc_large(tsd_t *tsd, arena_t *arena, szind_t ind, bool zero);
    545 void	*arena_malloc_hard(tsd_t *tsd, arena_t *arena, size_t size, szind_t ind,
    546     bool zero, tcache_t *tcache);
    547 void	*arena_palloc(tsd_t *tsd, arena_t *arena, size_t usize,
    548     size_t alignment, bool zero, tcache_t *tcache);
    549 void	arena_prof_promoted(const void *ptr, size_t size);
    550 void	arena_dalloc_bin_junked_locked(arena_t *arena, arena_chunk_t *chunk,
    551     void *ptr, arena_chunk_map_bits_t *bitselm);
    552 void	arena_dalloc_bin(arena_t *arena, arena_chunk_t *chunk, void *ptr,
    553     size_t pageind, arena_chunk_map_bits_t *bitselm);
    554 void	arena_dalloc_small(tsd_t *tsd, arena_t *arena, arena_chunk_t *chunk,
    555     void *ptr, size_t pageind);
    556 #ifdef JEMALLOC_JET
    557 typedef void (arena_dalloc_junk_large_t)(void *, size_t);
    558 extern arena_dalloc_junk_large_t *arena_dalloc_junk_large;
    559 #else
    560 void	arena_dalloc_junk_large(void *ptr, size_t usize);
    561 #endif
    562 void	arena_dalloc_large_junked_locked(arena_t *arena, arena_chunk_t *chunk,
    563     void *ptr);
    564 void	arena_dalloc_large(tsd_t *tsd, arena_t *arena, arena_chunk_t *chunk,
    565     void *ptr);
    566 #ifdef JEMALLOC_JET
    567 typedef void (arena_ralloc_junk_large_t)(void *, size_t, size_t);
    568 extern arena_ralloc_junk_large_t *arena_ralloc_junk_large;
    569 #endif
    570 bool	arena_ralloc_no_move(tsd_t *tsd, void *ptr, size_t oldsize, size_t size,
    571     size_t extra, bool zero);
    572 void	*arena_ralloc(tsd_t *tsd, arena_t *arena, void *ptr, size_t oldsize,
    573     size_t size, size_t alignment, bool zero, tcache_t *tcache);
    574 dss_prec_t	arena_dss_prec_get(arena_t *arena);
    575 bool	arena_dss_prec_set(arena_t *arena, dss_prec_t dss_prec);
    576 ssize_t	arena_lg_dirty_mult_default_get(void);
    577 bool	arena_lg_dirty_mult_default_set(ssize_t lg_dirty_mult);
    578 ssize_t	arena_decay_time_default_get(void);
    579 bool	arena_decay_time_default_set(ssize_t decay_time);
    580 void	arena_basic_stats_merge(arena_t *arena, unsigned *nthreads,
    581     const char **dss, ssize_t *lg_dirty_mult, ssize_t *decay_time,
    582     size_t *nactive, size_t *ndirty);
    583 void	arena_stats_merge(arena_t *arena, unsigned *nthreads, const char **dss,
    584     ssize_t *lg_dirty_mult, ssize_t *decay_time, size_t *nactive,
    585     size_t *ndirty, arena_stats_t *astats, malloc_bin_stats_t *bstats,
    586     malloc_large_stats_t *lstats, malloc_huge_stats_t *hstats);
    587 unsigned	arena_nthreads_get(arena_t *arena);
    588 void	arena_nthreads_inc(arena_t *arena);
    589 void	arena_nthreads_dec(arena_t *arena);
    590 arena_t	*arena_new(unsigned ind);
    591 bool	arena_boot(void);
    592 void	arena_prefork(arena_t *arena);
    593 void	arena_postfork_parent(arena_t *arena);
    594 void	arena_postfork_child(arena_t *arena);
    595 
    596 #endif /* JEMALLOC_H_EXTERNS */
    597 /******************************************************************************/
    598 #ifdef JEMALLOC_H_INLINES
    599 
    600 #ifndef JEMALLOC_ENABLE_INLINE
    601 arena_chunk_map_bits_t	*arena_bitselm_get(arena_chunk_t *chunk,
    602     size_t pageind);
    603 arena_chunk_map_misc_t	*arena_miscelm_get(arena_chunk_t *chunk,
    604     size_t pageind);
    605 size_t	arena_miscelm_to_pageind(const arena_chunk_map_misc_t *miscelm);
    606 void	*arena_miscelm_to_rpages(arena_chunk_map_misc_t *miscelm);
    607 arena_chunk_map_misc_t	*arena_rd_to_miscelm(arena_runs_dirty_link_t *rd);
    608 arena_chunk_map_misc_t	*arena_run_to_miscelm(arena_run_t *run);
    609 size_t	*arena_mapbitsp_get(arena_chunk_t *chunk, size_t pageind);
    610 size_t	arena_mapbitsp_read(size_t *mapbitsp);
    611 size_t	arena_mapbits_get(arena_chunk_t *chunk, size_t pageind);
    612 size_t	arena_mapbits_size_decode(size_t mapbits);
    613 size_t	arena_mapbits_unallocated_size_get(arena_chunk_t *chunk,
    614     size_t pageind);
    615 size_t	arena_mapbits_large_size_get(arena_chunk_t *chunk, size_t pageind);
    616 size_t	arena_mapbits_small_runind_get(arena_chunk_t *chunk, size_t pageind);
    617 szind_t	arena_mapbits_binind_get(arena_chunk_t *chunk, size_t pageind);
    618 size_t	arena_mapbits_dirty_get(arena_chunk_t *chunk, size_t pageind);
    619 size_t	arena_mapbits_unzeroed_get(arena_chunk_t *chunk, size_t pageind);
    620 size_t	arena_mapbits_decommitted_get(arena_chunk_t *chunk, size_t pageind);
    621 size_t	arena_mapbits_large_get(arena_chunk_t *chunk, size_t pageind);
    622 size_t	arena_mapbits_allocated_get(arena_chunk_t *chunk, size_t pageind);
    623 void	arena_mapbitsp_write(size_t *mapbitsp, size_t mapbits);
    624 size_t	arena_mapbits_size_encode(size_t size);
    625 void	arena_mapbits_unallocated_set(arena_chunk_t *chunk, size_t pageind,
    626     size_t size, size_t flags);
    627 void	arena_mapbits_unallocated_size_set(arena_chunk_t *chunk, size_t pageind,
    628     size_t size);
    629 void	arena_mapbits_internal_set(arena_chunk_t *chunk, size_t pageind,
    630     size_t flags);
    631 void	arena_mapbits_large_set(arena_chunk_t *chunk, size_t pageind,
    632     size_t size, size_t flags);
    633 void	arena_mapbits_large_binind_set(arena_chunk_t *chunk, size_t pageind,
    634     szind_t binind);
    635 void	arena_mapbits_small_set(arena_chunk_t *chunk, size_t pageind,
    636     size_t runind, szind_t binind, size_t flags);
    637 void	arena_metadata_allocated_add(arena_t *arena, size_t size);
    638 void	arena_metadata_allocated_sub(arena_t *arena, size_t size);
    639 size_t	arena_metadata_allocated_get(arena_t *arena);
    640 bool	arena_prof_accum_impl(arena_t *arena, uint64_t accumbytes);
    641 bool	arena_prof_accum_locked(arena_t *arena, uint64_t accumbytes);
    642 bool	arena_prof_accum(arena_t *arena, uint64_t accumbytes);
    643 szind_t	arena_ptr_small_binind_get(const void *ptr, size_t mapbits);
    644 szind_t	arena_bin_index(arena_t *arena, arena_bin_t *bin);
    645 size_t	arena_run_regind(arena_run_t *run, arena_bin_info_t *bin_info,
    646     const void *ptr);
    647 prof_tctx_t	*arena_prof_tctx_get(const void *ptr);
    648 void	arena_prof_tctx_set(const void *ptr, size_t usize, prof_tctx_t *tctx);
    649 void	arena_prof_tctx_reset(const void *ptr, size_t usize,
    650     const void *old_ptr, prof_tctx_t *old_tctx);
    651 void	arena_decay_ticks(tsd_t *tsd, arena_t *arena, unsigned nticks);
    652 void	arena_decay_tick(tsd_t *tsd, arena_t *arena);
    653 void	*arena_malloc(tsd_t *tsd, arena_t *arena, size_t size, szind_t ind,
    654     bool zero, tcache_t *tcache, bool slow_path);
    655 arena_t	*arena_aalloc(const void *ptr);
    656 size_t	arena_salloc(const void *ptr, bool demote);
    657 void	arena_dalloc(tsd_t *tsd, void *ptr, tcache_t *tcache, bool slow_path);
    658 void	arena_sdalloc(tsd_t *tsd, void *ptr, size_t size, tcache_t *tcache);
    659 #endif
    660 
    661 #if (defined(JEMALLOC_ENABLE_INLINE) || defined(JEMALLOC_ARENA_C_))
    662 #  ifdef JEMALLOC_ARENA_INLINE_A
    663 JEMALLOC_ALWAYS_INLINE arena_chunk_map_bits_t *
    664 arena_bitselm_get(arena_chunk_t *chunk, size_t pageind)
    665 {
    666 
    667 	assert(pageind >= map_bias);
    668 	assert(pageind < chunk_npages);
    669 
    670 	return (&chunk->map_bits[pageind-map_bias]);
    671 }
    672 
    673 JEMALLOC_ALWAYS_INLINE arena_chunk_map_misc_t *
    674 arena_miscelm_get(arena_chunk_t *chunk, size_t pageind)
    675 {
    676 
    677 	assert(pageind >= map_bias);
    678 	assert(pageind < chunk_npages);
    679 
    680 	return ((arena_chunk_map_misc_t *)((uintptr_t)chunk +
    681 	    (uintptr_t)map_misc_offset) + pageind-map_bias);
    682 }
    683 
    684 JEMALLOC_ALWAYS_INLINE size_t
    685 arena_miscelm_to_pageind(const arena_chunk_map_misc_t *miscelm)
    686 {
    687 	arena_chunk_t *chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(miscelm);
    688 	size_t pageind = ((uintptr_t)miscelm - ((uintptr_t)chunk +
    689 	    map_misc_offset)) / sizeof(arena_chunk_map_misc_t) + map_bias;
    690 
    691 	assert(pageind >= map_bias);
    692 	assert(pageind < chunk_npages);
    693 
    694 	return (pageind);
    695 }
    696 
    697 JEMALLOC_ALWAYS_INLINE void *
    698 arena_miscelm_to_rpages(arena_chunk_map_misc_t *miscelm)
    699 {
    700 	arena_chunk_t *chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(miscelm);
    701 	size_t pageind = arena_miscelm_to_pageind(miscelm);
    702 
    703 	return ((void *)((uintptr_t)chunk + (pageind << LG_PAGE)));
    704 }
    705 
    706 JEMALLOC_ALWAYS_INLINE arena_chunk_map_misc_t *
    707 arena_rd_to_miscelm(arena_runs_dirty_link_t *rd)
    708 {
    709 	arena_chunk_map_misc_t *miscelm = (arena_chunk_map_misc_t
    710 	    *)((uintptr_t)rd - offsetof(arena_chunk_map_misc_t, rd));
    711 
    712 	assert(arena_miscelm_to_pageind(miscelm) >= map_bias);
    713 	assert(arena_miscelm_to_pageind(miscelm) < chunk_npages);
    714 
    715 	return (miscelm);
    716 }
    717 
    718 JEMALLOC_ALWAYS_INLINE arena_chunk_map_misc_t *
    719 arena_run_to_miscelm(arena_run_t *run)
    720 {
    721 	arena_chunk_map_misc_t *miscelm = (arena_chunk_map_misc_t
    722 	    *)((uintptr_t)run - offsetof(arena_chunk_map_misc_t, run));
    723 
    724 	assert(arena_miscelm_to_pageind(miscelm) >= map_bias);
    725 	assert(arena_miscelm_to_pageind(miscelm) < chunk_npages);
    726 
    727 	return (miscelm);
    728 }
    729 
    730 JEMALLOC_ALWAYS_INLINE size_t *
    731 arena_mapbitsp_get(arena_chunk_t *chunk, size_t pageind)
    732 {
    733 
    734 	return (&arena_bitselm_get(chunk, pageind)->bits);
    735 }
    736 
    737 JEMALLOC_ALWAYS_INLINE size_t
    738 arena_mapbitsp_read(size_t *mapbitsp)
    739 {
    740 
    741 	return (*mapbitsp);
    742 }
    743 
    744 JEMALLOC_ALWAYS_INLINE size_t
    745 arena_mapbits_get(arena_chunk_t *chunk, size_t pageind)
    746 {
    747 
    748 	return (arena_mapbitsp_read(arena_mapbitsp_get(chunk, pageind)));
    749 }
    750 
    751 JEMALLOC_ALWAYS_INLINE size_t
    752 arena_mapbits_size_decode(size_t mapbits)
    753 {
    754 	size_t size;
    755 
    756 #if CHUNK_MAP_SIZE_SHIFT > 0
    757 	size = (mapbits & CHUNK_MAP_SIZE_MASK) >> CHUNK_MAP_SIZE_SHIFT;
    758 #elif CHUNK_MAP_SIZE_SHIFT == 0
    759 	size = mapbits & CHUNK_MAP_SIZE_MASK;
    760 #else
    761 	size = (mapbits & CHUNK_MAP_SIZE_MASK) << -CHUNK_MAP_SIZE_SHIFT;
    762 #endif
    763 
    764 	return (size);
    765 }
    766 
    767 JEMALLOC_ALWAYS_INLINE size_t
    768 arena_mapbits_unallocated_size_get(arena_chunk_t *chunk, size_t pageind)
    769 {
    770 	size_t mapbits;
    771 
    772 	mapbits = arena_mapbits_get(chunk, pageind);
    773 	assert((mapbits & (CHUNK_MAP_LARGE|CHUNK_MAP_ALLOCATED)) == 0);
    774 	return (arena_mapbits_size_decode(mapbits));
    775 }
    776 
    777 JEMALLOC_ALWAYS_INLINE size_t
    778 arena_mapbits_large_size_get(arena_chunk_t *chunk, size_t pageind)
    779 {
    780 	size_t mapbits;
    781 
    782 	mapbits = arena_mapbits_get(chunk, pageind);
    783 	assert((mapbits & (CHUNK_MAP_LARGE|CHUNK_MAP_ALLOCATED)) ==
    784 	    (CHUNK_MAP_LARGE|CHUNK_MAP_ALLOCATED));
    785 	return (arena_mapbits_size_decode(mapbits));
    786 }
    787 
    788 JEMALLOC_ALWAYS_INLINE size_t
    789 arena_mapbits_small_runind_get(arena_chunk_t *chunk, size_t pageind)
    790 {
    791 	size_t mapbits;
    792 
    793 	mapbits = arena_mapbits_get(chunk, pageind);
    794 	assert((mapbits & (CHUNK_MAP_LARGE|CHUNK_MAP_ALLOCATED)) ==
    795 	    CHUNK_MAP_ALLOCATED);
    796 	return (mapbits >> CHUNK_MAP_RUNIND_SHIFT);
    797 }
    798 
    799 JEMALLOC_ALWAYS_INLINE szind_t
    800 arena_mapbits_binind_get(arena_chunk_t *chunk, size_t pageind)
    801 {
    802 	size_t mapbits;
    803 	szind_t binind;
    804 
    805 	mapbits = arena_mapbits_get(chunk, pageind);
    806 	binind = (mapbits & CHUNK_MAP_BININD_MASK) >> CHUNK_MAP_BININD_SHIFT;
    807 	assert(binind < NBINS || binind == BININD_INVALID);
    808 	return (binind);
    809 }
    810 
    811 JEMALLOC_ALWAYS_INLINE size_t
    812 arena_mapbits_dirty_get(arena_chunk_t *chunk, size_t pageind)
    813 {
    814 	size_t mapbits;
    815 
    816 	mapbits = arena_mapbits_get(chunk, pageind);
    817 	assert((mapbits & CHUNK_MAP_DECOMMITTED) == 0 || (mapbits &
    818 	    (CHUNK_MAP_DIRTY|CHUNK_MAP_UNZEROED)) == 0);
    819 	return (mapbits & CHUNK_MAP_DIRTY);
    820 }
    821 
    822 JEMALLOC_ALWAYS_INLINE size_t
    823 arena_mapbits_unzeroed_get(arena_chunk_t *chunk, size_t pageind)
    824 {
    825 	size_t mapbits;
    826 
    827 	mapbits = arena_mapbits_get(chunk, pageind);
    828 	assert((mapbits & CHUNK_MAP_DECOMMITTED) == 0 || (mapbits &
    829 	    (CHUNK_MAP_DIRTY|CHUNK_MAP_UNZEROED)) == 0);
    830 	return (mapbits & CHUNK_MAP_UNZEROED);
    831 }
    832 
    833 JEMALLOC_ALWAYS_INLINE size_t
    834 arena_mapbits_decommitted_get(arena_chunk_t *chunk, size_t pageind)
    835 {
    836 	size_t mapbits;
    837 
    838 	mapbits = arena_mapbits_get(chunk, pageind);
    839 	assert((mapbits & CHUNK_MAP_DECOMMITTED) == 0 || (mapbits &
    840 	    (CHUNK_MAP_DIRTY|CHUNK_MAP_UNZEROED)) == 0);
    841 	return (mapbits & CHUNK_MAP_DECOMMITTED);
    842 }
    843 
    844 JEMALLOC_ALWAYS_INLINE size_t
    845 arena_mapbits_large_get(arena_chunk_t *chunk, size_t pageind)
    846 {
    847 	size_t mapbits;
    848 
    849 	mapbits = arena_mapbits_get(chunk, pageind);
    850 	return (mapbits & CHUNK_MAP_LARGE);
    851 }
    852 
    853 JEMALLOC_ALWAYS_INLINE size_t
    854 arena_mapbits_allocated_get(arena_chunk_t *chunk, size_t pageind)
    855 {
    856 	size_t mapbits;
    857 
    858 	mapbits = arena_mapbits_get(chunk, pageind);
    859 	return (mapbits & CHUNK_MAP_ALLOCATED);
    860 }
    861 
    862 JEMALLOC_ALWAYS_INLINE void
    863 arena_mapbitsp_write(size_t *mapbitsp, size_t mapbits)
    864 {
    865 
    866 	*mapbitsp = mapbits;
    867 }
    868 
    869 JEMALLOC_ALWAYS_INLINE size_t
    870 arena_mapbits_size_encode(size_t size)
    871 {
    872 	size_t mapbits;
    873 
    874 #if CHUNK_MAP_SIZE_SHIFT > 0
    875 	mapbits = size << CHUNK_MAP_SIZE_SHIFT;
    876 #elif CHUNK_MAP_SIZE_SHIFT == 0
    877 	mapbits = size;
    878 #else
    879 	mapbits = size >> -CHUNK_MAP_SIZE_SHIFT;
    880 #endif
    881 
    882 	assert((mapbits & ~CHUNK_MAP_SIZE_MASK) == 0);
    883 	return (mapbits);
    884 }
    885 
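/*
 * Illustrative round trip (assuming LG_PAGE == 12, so CHUNK_MAP_SIZE_SHIFT ==
 * 1): arena_mapbits_size_encode(0x3000) == 0x6000, and
 * arena_mapbits_size_decode(0x6000) == 0x3000, i.e. a three-page run size
 * survives the trip through the size bits of the map word.
 */
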
    886 JEMALLOC_ALWAYS_INLINE void
    887 arena_mapbits_unallocated_set(arena_chunk_t *chunk, size_t pageind, size_t size,
    888     size_t flags)
    889 {
    890 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    891 
    892 	assert((size & PAGE_MASK) == 0);
    893 	assert((flags & CHUNK_MAP_FLAGS_MASK) == flags);
    894 	assert((flags & CHUNK_MAP_DECOMMITTED) == 0 || (flags &
    895 	    (CHUNK_MAP_DIRTY|CHUNK_MAP_UNZEROED)) == 0);
    896 	arena_mapbitsp_write(mapbitsp, arena_mapbits_size_encode(size) |
    897 	    CHUNK_MAP_BININD_INVALID | flags);
    898 }
    899 
    900 JEMALLOC_ALWAYS_INLINE void
    901 arena_mapbits_unallocated_size_set(arena_chunk_t *chunk, size_t pageind,
    902     size_t size)
    903 {
    904 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    905 	size_t mapbits = arena_mapbitsp_read(mapbitsp);
    906 
    907 	assert((size & PAGE_MASK) == 0);
    908 	assert((mapbits & (CHUNK_MAP_LARGE|CHUNK_MAP_ALLOCATED)) == 0);
    909 	arena_mapbitsp_write(mapbitsp, arena_mapbits_size_encode(size) |
    910 	    (mapbits & ~CHUNK_MAP_SIZE_MASK));
    911 }
    912 
    913 JEMALLOC_ALWAYS_INLINE void
    914 arena_mapbits_internal_set(arena_chunk_t *chunk, size_t pageind, size_t flags)
    915 {
    916 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    917 
    918 	assert((flags & CHUNK_MAP_UNZEROED) == flags);
    919 	arena_mapbitsp_write(mapbitsp, flags);
    920 }
    921 
    922 JEMALLOC_ALWAYS_INLINE void
    923 arena_mapbits_large_set(arena_chunk_t *chunk, size_t pageind, size_t size,
    924     size_t flags)
    925 {
    926 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    927 
    928 	assert((size & PAGE_MASK) == 0);
    929 	assert((flags & CHUNK_MAP_FLAGS_MASK) == flags);
    930 	assert((flags & CHUNK_MAP_DECOMMITTED) == 0 || (flags &
    931 	    (CHUNK_MAP_DIRTY|CHUNK_MAP_UNZEROED)) == 0);
    932 	arena_mapbitsp_write(mapbitsp, arena_mapbits_size_encode(size) |
    933 	    CHUNK_MAP_BININD_INVALID | flags | CHUNK_MAP_LARGE |
    934 	    CHUNK_MAP_ALLOCATED);
    935 }
    936 
    937 JEMALLOC_ALWAYS_INLINE void
    938 arena_mapbits_large_binind_set(arena_chunk_t *chunk, size_t pageind,
    939     szind_t binind)
    940 {
    941 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    942 	size_t mapbits = arena_mapbitsp_read(mapbitsp);
    943 
    944 	assert(binind <= BININD_INVALID);
    945 	assert(arena_mapbits_large_size_get(chunk, pageind) == LARGE_MINCLASS +
    946 	    large_pad);
    947 	arena_mapbitsp_write(mapbitsp, (mapbits & ~CHUNK_MAP_BININD_MASK) |
    948 	    (binind << CHUNK_MAP_BININD_SHIFT));
    949 }
    950 
    951 JEMALLOC_ALWAYS_INLINE void
    952 arena_mapbits_small_set(arena_chunk_t *chunk, size_t pageind, size_t runind,
    953     szind_t binind, size_t flags)
    954 {
    955 	size_t *mapbitsp = arena_mapbitsp_get(chunk, pageind);
    956 
    957 	assert(binind < BININD_INVALID);
    958 	assert(pageind - runind >= map_bias);
    959 	assert((flags & CHUNK_MAP_UNZEROED) == flags);
    960 	arena_mapbitsp_write(mapbitsp, (runind << CHUNK_MAP_RUNIND_SHIFT) |
    961 	    (binind << CHUNK_MAP_BININD_SHIFT) | flags | CHUNK_MAP_ALLOCATED);
    962 }
    963 
    964 JEMALLOC_INLINE void
    965 arena_metadata_allocated_add(arena_t *arena, size_t size)
    966 {
    967 
    968 	atomic_add_z(&arena->stats.metadata_allocated, size);
    969 }
    970 
    971 JEMALLOC_INLINE void
    972 arena_metadata_allocated_sub(arena_t *arena, size_t size)
    973 {
    974 
    975 	atomic_sub_z(&arena->stats.metadata_allocated, size);
    976 }
    977 
    978 JEMALLOC_INLINE size_t
    979 arena_metadata_allocated_get(arena_t *arena)
    980 {
    981 
    982 	return (atomic_read_z(&arena->stats.metadata_allocated));
    983 }
    984 
    985 JEMALLOC_INLINE bool
    986 arena_prof_accum_impl(arena_t *arena, uint64_t accumbytes)
    987 {
    988 
    989 	cassert(config_prof);
    990 	assert(prof_interval != 0);
    991 
    992 	arena->prof_accumbytes += accumbytes;
    993 	if (arena->prof_accumbytes >= prof_interval) {
    994 		arena->prof_accumbytes -= prof_interval;
    995 		return (true);
    996 	}
    997 	return (false);
    998 }
    999 
   1000 JEMALLOC_INLINE bool
   1001 arena_prof_accum_locked(arena_t *arena, uint64_t accumbytes)
   1002 {
   1003 
   1004 	cassert(config_prof);
   1005 
   1006 	if (likely(prof_interval == 0))
   1007 		return (false);
   1008 	return (arena_prof_accum_impl(arena, accumbytes));
   1009 }
   1010 
   1011 JEMALLOC_INLINE bool
   1012 arena_prof_accum(arena_t *arena, uint64_t accumbytes)
   1013 {
   1014 
   1015 	cassert(config_prof);
   1016 
   1017 	if (likely(prof_interval == 0))
   1018 		return (false);
   1019 
   1020 	{
   1021 		bool ret;
   1022 
   1023 		malloc_mutex_lock(&arena->lock);
   1024 		ret = arena_prof_accum_impl(arena, accumbytes);
   1025 		malloc_mutex_unlock(&arena->lock);
   1026 		return (ret);
   1027 	}
   1028 }
   1029 
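/*
 * Worked example (illustrative): with prof_interval == 1 MiB,
 * arena_prof_accum() returns true approximately once per MiB of allocation,
 * after which prof_accumbytes is reduced by prof_interval and accumulation
 * continues.
 */
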
   1030 JEMALLOC_ALWAYS_INLINE szind_t
   1031 arena_ptr_small_binind_get(const void *ptr, size_t mapbits)
   1032 {
   1033 	szind_t binind;
   1034 
   1035 	binind = (mapbits & CHUNK_MAP_BININD_MASK) >> CHUNK_MAP_BININD_SHIFT;
   1036 
   1037 	if (config_debug) {
   1038 		arena_chunk_t *chunk;
   1039 		arena_t *arena;
   1040 		size_t pageind;
   1041 		size_t actual_mapbits;
   1042 		size_t rpages_ind;
   1043 		arena_run_t *run;
   1044 		arena_bin_t *bin;
   1045 		szind_t run_binind, actual_binind;
   1046 		arena_bin_info_t *bin_info;
   1047 		arena_chunk_map_misc_t *miscelm;
   1048 		void *rpages;
   1049 
   1050 		assert(binind != BININD_INVALID);
   1051 		assert(binind < NBINS);
   1052 		chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1053 		arena = extent_node_arena_get(&chunk->node);
   1054 		pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >> LG_PAGE;
   1055 		actual_mapbits = arena_mapbits_get(chunk, pageind);
   1056 		assert(mapbits == actual_mapbits);
   1057 		assert(arena_mapbits_large_get(chunk, pageind) == 0);
   1058 		assert(arena_mapbits_allocated_get(chunk, pageind) != 0);
   1059 		rpages_ind = pageind - arena_mapbits_small_runind_get(chunk,
   1060 		    pageind);
   1061 		miscelm = arena_miscelm_get(chunk, rpages_ind);
   1062 		run = &miscelm->run;
   1063 		run_binind = run->binind;
   1064 		bin = &arena->bins[run_binind];
   1065 		actual_binind = (szind_t)(bin - arena->bins);
   1066 		assert(run_binind == actual_binind);
   1067 		bin_info = &arena_bin_info[actual_binind];
   1068 		rpages = arena_miscelm_to_rpages(miscelm);
   1069 		assert(((uintptr_t)ptr - ((uintptr_t)rpages +
   1070 		    (uintptr_t)bin_info->reg0_offset)) % bin_info->reg_interval
   1071 		    == 0);
   1072 	}
   1073 
   1074 	return (binind);
   1075 }
   1076 #  endif /* JEMALLOC_ARENA_INLINE_A */
   1077 
   1078 #  ifdef JEMALLOC_ARENA_INLINE_B
   1079 JEMALLOC_INLINE szind_t
   1080 arena_bin_index(arena_t *arena, arena_bin_t *bin)
   1081 {
   1082 	szind_t binind = (szind_t)(bin - arena->bins);
   1083 	assert(binind < NBINS);
   1084 	return (binind);
   1085 }
   1086 
   1087 JEMALLOC_INLINE size_t
   1088 arena_run_regind(arena_run_t *run, arena_bin_info_t *bin_info, const void *ptr)
   1089 {
   1090 	size_t diff, interval, shift, regind;
   1091 	arena_chunk_map_misc_t *miscelm = arena_run_to_miscelm(run);
   1092 	void *rpages = arena_miscelm_to_rpages(miscelm);
   1093 
   1094 	/*
   1095 	 * Freeing a pointer lower than region zero can cause assertion
	 * Freeing a pointer lower than region zero can cause an assertion
	 * failure.
   1098 	assert((uintptr_t)ptr >= (uintptr_t)rpages +
   1099 	    (uintptr_t)bin_info->reg0_offset);
   1100 
   1101 	/*
   1102 	 * Avoid doing division with a variable divisor if possible.  Using
   1103 	 * actual division here can reduce allocator throughput by over 20%!
   1104 	 */
   1105 	diff = (size_t)((uintptr_t)ptr - (uintptr_t)rpages -
   1106 	    bin_info->reg0_offset);
   1107 
   1108 	/* Rescale (factor powers of 2 out of the numerator and denominator). */
   1109 	interval = bin_info->reg_interval;
   1110 	shift = ffs_zu(interval) - 1;
   1111 	diff >>= shift;
   1112 	interval >>= shift;
   1113 
   1114 	if (interval == 1) {
   1115 		/* The divisor was a power of 2. */
   1116 		regind = diff;
   1117 	} else {
   1118 		/*
		 * To divide by a number D that is not a power of two we multiply
		 * by (2^SIZE_INV_SHIFT / D) and then right shift by SIZE_INV_SHIFT.
   1121 		 *
   1122 		 *   X / D
   1123 		 *
   1124 		 * becomes
   1125 		 *
   1126 		 *   (X * interval_invs[D - 3]) >> SIZE_INV_SHIFT
   1127 		 *
   1128 		 * We can omit the first three elements, because we never
   1129 		 * divide by 0, and 1 and 2 are both powers of two, which are
   1130 		 * handled above.
   1131 		 */
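		/*
		 * Worked example (illustrative): for reg_interval == 48 and
		 * diff == 96, the rescaling above strips the factor of 16,
		 * leaving interval == 3 and diff == 6; regind is then
		 * (6 * SIZE_INV(3)) >> SIZE_INV_SHIFT == 2, matching 96 / 48.
		 */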
   1132 #define	SIZE_INV_SHIFT	((sizeof(size_t) << 3) - LG_RUN_MAXREGS)
   1133 #define	SIZE_INV(s)	(((ZU(1) << SIZE_INV_SHIFT) / (s)) + 1)
   1134 		static const size_t interval_invs[] = {
   1135 		    SIZE_INV(3),
   1136 		    SIZE_INV(4), SIZE_INV(5), SIZE_INV(6), SIZE_INV(7),
   1137 		    SIZE_INV(8), SIZE_INV(9), SIZE_INV(10), SIZE_INV(11),
   1138 		    SIZE_INV(12), SIZE_INV(13), SIZE_INV(14), SIZE_INV(15),
   1139 		    SIZE_INV(16), SIZE_INV(17), SIZE_INV(18), SIZE_INV(19),
   1140 		    SIZE_INV(20), SIZE_INV(21), SIZE_INV(22), SIZE_INV(23),
   1141 		    SIZE_INV(24), SIZE_INV(25), SIZE_INV(26), SIZE_INV(27),
   1142 		    SIZE_INV(28), SIZE_INV(29), SIZE_INV(30), SIZE_INV(31)
   1143 		};
   1144 
   1145 		if (likely(interval <= ((sizeof(interval_invs) / sizeof(size_t))
   1146 		    + 2))) {
   1147 			regind = (diff * interval_invs[interval - 3]) >>
   1148 			    SIZE_INV_SHIFT;
   1149 		} else
   1150 			regind = diff / interval;
   1151 #undef SIZE_INV
   1152 #undef SIZE_INV_SHIFT
   1153 	}
   1154 	assert(diff == regind * interval);
   1155 	assert(regind < bin_info->nregs);
   1156 
   1157 	return (regind);
   1158 }
   1159 
   1160 JEMALLOC_INLINE prof_tctx_t *
   1161 arena_prof_tctx_get(const void *ptr)
   1162 {
   1163 	prof_tctx_t *ret;
   1164 	arena_chunk_t *chunk;
   1165 
   1166 	cassert(config_prof);
   1167 	assert(ptr != NULL);
   1168 
   1169 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1170 	if (likely(chunk != ptr)) {
   1171 		size_t pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >> LG_PAGE;
   1172 		size_t mapbits = arena_mapbits_get(chunk, pageind);
   1173 		assert((mapbits & CHUNK_MAP_ALLOCATED) != 0);
   1174 		if (likely((mapbits & CHUNK_MAP_LARGE) == 0))
   1175 			ret = (prof_tctx_t *)(uintptr_t)1U;
   1176 		else {
   1177 			arena_chunk_map_misc_t *elm = arena_miscelm_get(chunk,
   1178 			    pageind);
   1179 			ret = atomic_read_p(&elm->prof_tctx_pun);
   1180 		}
   1181 	} else
   1182 		ret = huge_prof_tctx_get(ptr);
   1183 
   1184 	return (ret);
   1185 }
   1186 
   1187 JEMALLOC_INLINE void
   1188 arena_prof_tctx_set(const void *ptr, size_t usize, prof_tctx_t *tctx)
   1189 {
   1190 	arena_chunk_t *chunk;
   1191 
   1192 	cassert(config_prof);
   1193 	assert(ptr != NULL);
   1194 
   1195 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1196 	if (likely(chunk != ptr)) {
   1197 		size_t pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >> LG_PAGE;
   1198 
   1199 		assert(arena_mapbits_allocated_get(chunk, pageind) != 0);
   1200 
   1201 		if (unlikely(usize > SMALL_MAXCLASS || (uintptr_t)tctx >
   1202 		    (uintptr_t)1U)) {
   1203 			arena_chunk_map_misc_t *elm;
   1204 
   1205 			assert(arena_mapbits_large_get(chunk, pageind) != 0);
   1206 
   1207 			elm = arena_miscelm_get(chunk, pageind);
   1208 			atomic_write_p(&elm->prof_tctx_pun, tctx);
   1209 		} else {
   1210 			/*
   1211 			 * tctx must always be initialized for large runs.
   1212 			 * Assert that the surrounding conditional logic is
   1213 			 * equivalent to checking whether ptr refers to a large
   1214 			 * run.
   1215 			 */
   1216 			assert(arena_mapbits_large_get(chunk, pageind) == 0);
   1217 		}
   1218 	} else
   1219 		huge_prof_tctx_set(ptr, tctx);
   1220 }
   1221 
   1222 JEMALLOC_INLINE void
   1223 arena_prof_tctx_reset(const void *ptr, size_t usize, const void *old_ptr,
   1224     prof_tctx_t *old_tctx)
   1225 {
   1226 
   1227 	cassert(config_prof);
   1228 	assert(ptr != NULL);
   1229 
   1230 	if (unlikely(usize > SMALL_MAXCLASS || (ptr == old_ptr &&
   1231 	    (uintptr_t)old_tctx > (uintptr_t)1U))) {
   1232 		arena_chunk_t *chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1233 		if (likely(chunk != ptr)) {
   1234 			size_t pageind;
   1235 			arena_chunk_map_misc_t *elm;
   1236 
   1237 			pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >>
   1238 			    LG_PAGE;
   1239 			assert(arena_mapbits_allocated_get(chunk, pageind) !=
   1240 			    0);
   1241 			assert(arena_mapbits_large_get(chunk, pageind) != 0);
   1242 
   1243 			elm = arena_miscelm_get(chunk, pageind);
   1244 			atomic_write_p(&elm->prof_tctx_pun,
   1245 			    (prof_tctx_t *)(uintptr_t)1U);
   1246 		} else
   1247 			huge_prof_tctx_reset(ptr);
   1248 	}
   1249 }
   1250 
   1251 JEMALLOC_ALWAYS_INLINE void
   1252 arena_decay_ticks(tsd_t *tsd, arena_t *arena, unsigned nticks)
   1253 {
   1254 	ticker_t *decay_ticker;
   1255 
   1256 	if (unlikely(tsd == NULL))
   1257 		return;
   1258 	decay_ticker = decay_ticker_get(tsd, arena->ind);
   1259 	if (unlikely(decay_ticker == NULL))
   1260 		return;
   1261 	if (unlikely(ticker_ticks(decay_ticker, nticks)))
   1262 		arena_purge(arena, false);
   1263 }
   1264 
   1265 JEMALLOC_ALWAYS_INLINE void
   1266 arena_decay_tick(tsd_t *tsd, arena_t *arena)
   1267 {
   1268 
   1269 	arena_decay_ticks(tsd, arena, 1);
   1270 }
   1271 
   1272 JEMALLOC_ALWAYS_INLINE void *
   1273 arena_malloc(tsd_t *tsd, arena_t *arena, size_t size, szind_t ind, bool zero,
   1274     tcache_t *tcache, bool slow_path)
   1275 {
   1276 
   1277 	assert(size != 0);
   1278 
   1279 	if (likely(tcache != NULL)) {
   1280 		if (likely(size <= SMALL_MAXCLASS)) {
   1281 			return (tcache_alloc_small(tsd, arena, tcache, size,
   1282 			    ind, zero, slow_path));
   1283 		}
   1284 		if (likely(size <= tcache_maxclass)) {
   1285 			return (tcache_alloc_large(tsd, arena, tcache, size,
   1286 			    ind, zero, slow_path));
   1287 		}
   1288 		/* (size > tcache_maxclass) case falls through. */
   1289 		assert(size > tcache_maxclass);
   1290 	}
   1291 
   1292 	return (arena_malloc_hard(tsd, arena, size, ind, zero, tcache));
   1293 }
   1294 
   1295 JEMALLOC_ALWAYS_INLINE arena_t *
   1296 arena_aalloc(const void *ptr)
   1297 {
   1298 	arena_chunk_t *chunk;
   1299 
   1300 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1301 	if (likely(chunk != ptr))
   1302 		return (extent_node_arena_get(&chunk->node));
   1303 	else
   1304 		return (huge_aalloc(ptr));
   1305 }
   1306 
   1307 /* Return the size of the allocation pointed to by ptr. */
   1308 JEMALLOC_ALWAYS_INLINE size_t
   1309 arena_salloc(const void *ptr, bool demote)
   1310 {
   1311 	size_t ret;
   1312 	arena_chunk_t *chunk;
   1313 	size_t pageind;
   1314 	szind_t binind;
   1315 
   1316 	assert(ptr != NULL);
   1317 
   1318 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1319 	if (likely(chunk != ptr)) {
   1320 		pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >> LG_PAGE;
   1321 		assert(arena_mapbits_allocated_get(chunk, pageind) != 0);
   1322 		binind = arena_mapbits_binind_get(chunk, pageind);
   1323 		if (unlikely(binind == BININD_INVALID || (config_prof && !demote
   1324 		    && arena_mapbits_large_get(chunk, pageind) != 0))) {
   1325 			/*
   1326 			 * Large allocation.  In the common case (demote), and
   1327 			 * as this is an inline function, most callers will only
   1328 			 * end up looking at binind to determine that ptr is a
   1329 			 * small allocation.
   1330 			 */
   1331 			assert(config_cache_oblivious || ((uintptr_t)ptr &
   1332 			    PAGE_MASK) == 0);
   1333 			ret = arena_mapbits_large_size_get(chunk, pageind) -
   1334 			    large_pad;
   1335 			assert(ret != 0);
   1336 			assert(pageind + ((ret+large_pad)>>LG_PAGE) <=
   1337 			    chunk_npages);
   1338 			assert(arena_mapbits_dirty_get(chunk, pageind) ==
   1339 			    arena_mapbits_dirty_get(chunk,
   1340 			    pageind+((ret+large_pad)>>LG_PAGE)-1));
   1341 		} else {
   1342 			/*
   1343 			 * Small allocation (possibly promoted to a large
   1344 			 * object).
   1345 			 */
   1346 			assert(arena_mapbits_large_get(chunk, pageind) != 0 ||
   1347 			    arena_ptr_small_binind_get(ptr,
   1348 			    arena_mapbits_get(chunk, pageind)) == binind);
   1349 			ret = index2size(binind);
   1350 		}
   1351 	} else
   1352 		ret = huge_salloc(ptr);
   1353 
   1354 	return (ret);
   1355 }
   1356 
   1357 JEMALLOC_ALWAYS_INLINE void
   1358 arena_dalloc(tsd_t *tsd, void *ptr, tcache_t *tcache, bool slow_path)
   1359 {
   1360 	arena_chunk_t *chunk;
   1361 	size_t pageind, mapbits;
   1362 
   1363 	assert(ptr != NULL);
   1364 
   1365 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1366 	if (likely(chunk != ptr)) {
   1367 		pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >> LG_PAGE;
   1368 #if defined(__ANDROID__)
   1369 		/* Verify the ptr is actually in the chunk. */
   1370 		if (unlikely(pageind < map_bias || pageind >= chunk_npages)) {
   1371 		    __libc_fatal("Invalid address %p passed to free: invalid page index", ptr);
   1372 		}
   1373 #endif
   1374 		mapbits = arena_mapbits_get(chunk, pageind);
   1375 		assert(arena_mapbits_allocated_get(chunk, pageind) != 0);
   1376 #if defined(__ANDROID__)
   1377 		/* Verify the ptr has been allocated. */
   1378 		if (unlikely((mapbits & CHUNK_MAP_ALLOCATED) == 0)) {
   1379 		    __libc_fatal("Invalid address %p passed to free: value not allocated", ptr);
   1380 		}
   1381 #endif
   1382 		if (likely((mapbits & CHUNK_MAP_LARGE) == 0)) {
   1383 			/* Small allocation. */
   1384 			if (likely(tcache != NULL)) {
   1385 				szind_t binind = arena_ptr_small_binind_get(ptr,
   1386 				    mapbits);
   1387 				tcache_dalloc_small(tsd, tcache, ptr, binind,
   1388 				    slow_path);
   1389 			} else {
   1390 				arena_dalloc_small(tsd, extent_node_arena_get(
   1391 				    &chunk->node), chunk, ptr, pageind);
   1392 			}
   1393 		} else {
   1394 			size_t size = arena_mapbits_large_size_get(chunk,
   1395 			    pageind);
   1396 
   1397 			assert(config_cache_oblivious || ((uintptr_t)ptr &
   1398 			    PAGE_MASK) == 0);
   1399 
   1400 			if (likely(tcache != NULL) && size - large_pad <=
   1401 			    tcache_maxclass) {
   1402 				tcache_dalloc_large(tsd, tcache, ptr, size -
   1403 				    large_pad, slow_path);
   1404 			} else {
   1405 				arena_dalloc_large(tsd, extent_node_arena_get(
   1406 				    &chunk->node), chunk, ptr);
   1407 			}
   1408 		}
   1409 	} else
   1410 		huge_dalloc(tsd, ptr, tcache);
   1411 }
   1412 
   1413 JEMALLOC_ALWAYS_INLINE void
   1414 arena_sdalloc(tsd_t *tsd, void *ptr, size_t size, tcache_t *tcache)
   1415 {
   1416 	arena_chunk_t *chunk;
   1417 
   1418 	chunk = (arena_chunk_t *)CHUNK_ADDR2BASE(ptr);
   1419 	if (likely(chunk != ptr)) {
   1420 		if (config_prof && opt_prof) {
   1421 			size_t pageind = ((uintptr_t)ptr - (uintptr_t)chunk) >>
   1422 			    LG_PAGE;
   1423 			assert(arena_mapbits_allocated_get(chunk, pageind) !=
   1424 			    0);
   1425 			if (arena_mapbits_large_get(chunk, pageind) != 0) {
   1426 				/*
   1427 				 * Make sure to use promoted size, not request
   1428 				 * size.
   1429 				 */
   1430 				size = arena_mapbits_large_size_get(chunk,
   1431 				    pageind) - large_pad;
   1432 			}
   1433 		}
   1434 		assert(s2u(size) == s2u(arena_salloc(ptr, false)));
   1435 
   1436 		if (likely(size <= SMALL_MAXCLASS)) {
   1437 			/* Small allocation. */
   1438 			if (likely(tcache != NULL)) {
   1439 				szind_t binind = size2index(size);
   1440 				tcache_dalloc_small(tsd, tcache, ptr, binind,
   1441 				    true);
   1442 			} else {
   1443 				size_t pageind = ((uintptr_t)ptr -
   1444 				    (uintptr_t)chunk) >> LG_PAGE;
   1445 				arena_dalloc_small(tsd, extent_node_arena_get(
   1446 				    &chunk->node), chunk, ptr, pageind);
   1447 			}
   1448 		} else {
   1449 			assert(config_cache_oblivious || ((uintptr_t)ptr &
   1450 			    PAGE_MASK) == 0);
   1451 
   1452 			if (likely(tcache != NULL) && size <= tcache_maxclass) {
   1453 				tcache_dalloc_large(tsd, tcache, ptr, size,
   1454 				    true);
   1455 			} else {
   1456 				arena_dalloc_large(tsd, extent_node_arena_get(
   1457 				    &chunk->node), chunk, ptr);
   1458 			}
   1459 		}
   1460 	} else
   1461 		huge_dalloc(tsd, ptr, tcache);
   1462 }
   1463 #  endif /* JEMALLOC_ARENA_INLINE_B */
   1464 #endif
   1465 
   1466 #endif /* JEMALLOC_H_INLINES */
   1467 /******************************************************************************/
   1468