.\" SPDX-License-Identifier: BSD-2-Clause .\" Copyright (C) 2014 - 2021 Intel Corporation. .\" .TH "MEMKIND" 3 "2015-03-31" "Intel Corporation" "MEMKIND" \" -*- nroff -*- .SH "NAME" memkind \- Heap manager that enables allocations to memory with different properties. .br This header expose STANDARD and EXPERIMENTAL API. API Standards are described below in this man page. .SH "SYNOPSIS" .nf .B #include .sp .B Link with -lmemkind .br .SS "EXPERIMENTAL API:" .sp .B "HEAP MANAGEMENT:" .br .BI "int memkind_posix_memalign(memkind_t " "kind" ", void " "**memptr" ", size_t " "alignment" ", size_t " "size" ); .sp .B "KIND MANAGEMENT:" .br .BI "int memkind_create_kind(memkind_memtype_t " "memtype_flags" ", memkind_policy_t " "policy" ", memkind_bits_t " "flags" ", memkind_t " "*kind" ); .sp .SS "STANDARD API:" .sp .B "ERROR HANDLING:" .br .BI "void memkind_error_message(int " "err" ", char " "*msg" ", size_t " "size" ); .sp .B "LIBRARY VERSION:" .br .BI "int memkind_get_version();" .sp .B "HEAP MANAGEMENT:" .br .BI "void *memkind_malloc(memkind_t " "kind" ", size_t " "size" ); .br .BI "void *memkind_calloc(memkind_t " "kind" ", size_t " "num" ", size_t " "size" ); .br .BI "void *memkind_realloc(memkind_t " "kind" ", void " "*ptr" ", size_t " "size" ); .br .BI "void memkind_free(memkind_t " "kind" ", void " "*ptr" ); .br .BI "size_t memkind_malloc_usable_size(memkind_t " "kind" ", void " "*ptr" ); .br .BI "void *memkind_defrag_reallocate(memkind_t " "kind" ", void " "*ptr" ); .br .BI "memkind_t memkind_detect_kind(void " "*ptr" ); .sp .B "KIND CONFIGURATION MANAGEMENT:" .br .BI "struct memkind_config *memkind_config_new();" .br .BI "void memkind_config_delete(struct memkind_config " "*cfg" ); .br .BI "void memkind_config_set_path(struct memkind_config " "*cfg" ", const char " "*pmem_dir" ); .br .BI "void memkind_config_set_size(struct memkind_config " "*cfg" ", size_t " "pmem_size" ); .br .BI "void memkind_config_set_memory_usage_policy(struct memkind_config " "*cfg" ", memkind_mem_usage_policy " "policy" ); .sp .B "KIND MANAGEMENT:" .br .BI "int memkind_create_fixed(void " "*addr" ", size_t " "size" ", memkind_t " "*kind" ); .br .BI "int memkind_create_pmem(const char " "*dir" ", size_t " "max_size" ", memkind_t " "*kind" ); .br .BI "int memkind_create_pmem_with_config(struct memkind_config " "*cfg" ", memkind_t " "*kind" ); .br .BI "int memkind_destroy_kind(memkind_t " "kind" ); .br .BI "int memkind_check_available(memkind_t " "kind" ); .br .BI "ssize_t memkind_get_capacity(memkind_t " "kind" ); .br .BI "int memkind_check_dax_path(const char " "*pmem_dir" ); .sp .B "STATISTICS:" .br .BI "int memkind_update_cached_stats(void);" .br .BI "int memkind_get_stat(memkind_t " "kind" ", memkind_stat " "stat" ", size_t " "*value" ); .br .BI "int memkind_stats_print(void " "(*write_cb) (void *, const char *)" ", void " "*cbopaque" ", memkind_stat_print_opt " "opts" ); .sp .B "DECORATORS:" .br .BI "void memkind_malloc_pre(memkind_t " "*kind" ", size_t " "*size" ); .br .BI "void memkind_malloc_post(memkind_t " "kind" ", size_t " "size" ", void " "**result" ); .br .BI "void memkind_calloc_pre(memkind_t " "*kind" ", size_t " "*nmemb" ", size_t " "*size" ); .br .BI "void memkind_calloc_post(memkind_t " "kind" ", size_t " "nmemb" ", size_t " "size" ", void " "**result" ); .br .BI "void memkind_posix_memalign_pre(memkind_t " "*kind" ", void " "**memptr" ", size_t " "*alignment" ", size_t " "*size" ); .br .BI "void memkind_posix_memalign_post(memkind_t " "kind" ", void " "**memptr" ", size_t " "alignment" ", size_t " "size" ", int " "*err" ); .br .BI "void memkind_realloc_pre(memkind_t " "*kind" ", void " "**ptr" ", size_t " "*size" ); .br .BI "void memkind_realloc_post(memkind_t " "*kind" ", void " "*ptr" ", size_t " "size" ", void " "**result" ); .br .BI "void memkind_free_pre(memkind_t " "*kind" ", void " "**ptr" ); .br .BI "void memkind_free_post(memkind_t " "kind" ", void " "*ptr" ); .sp .B "ENHANCEMENTS:" .br .BI "int memkind_set_bg_threads(bool " "state" ); .sp .sp .br .SH "DESCRIPTION" .PP .BR memkind_error_message () converts an error number .I err returned by a member of the memkind interface to an error message .I msg where the maximum size of the message is passed by the .I size parameter. .B "HEAP MANAGEMENT:" .br The functions described in this section define a heap manager with an interface modeled on the ISO C standard API's, except that the user must specify the .I kind of memory with the first argument to each function. See the .B KINDS section below for a full description of the implemented kinds. For file-backed kind of memory see .BR memkind_create_pmem () or .BR memkind_create_pmem_with_config (). For memory kind created on user-specified area, please check .BR memkind_create_fixed (). .PP .BR memkind_malloc () allocates .I size bytes of uninitialized memory of the specified .IR "kind" . The allocated space is suitably aligned (after possible pointer coercion) for storage of any type of object. If .I size is 0, then .BR memkind_malloc () returns .IR "NULL" . .PP .BR memkind_calloc () allocates space for .I num objects each .I size bytes in length in memory of the specified .IR "kind" . The result is identical to calling .BR memkind_malloc () with an argument of .IR num * .IR "size" , with the exception that the allocated memory is explicitly initialized to zero bytes. If .I num or .I size is 0, then .BR memkind_calloc () returns .IR "NULL" . .PP .BR memkind_realloc () changes the size of the previously allocated memory referenced by .I ptr to .I size bytes of the specified .IR "kind" . The contents of the memory remain unchanged up to the lesser of the new and old sizes. If the new size is larger, the contents of the newly allocated portion of the memory are undefined. Upon success, the memory referenced by .I ptr is freed and a pointer to the newly allocated memory is returned. .BR Note: .BR memkind_realloc () may move the memory allocation, resulting in a different return value than .IR "ptr" . If .I ptr is .IR "NULL" , the .BR memkind_realloc () function behaves identically to .BR memkind_malloc () for the specified size. If .I size is equal to zero, and .I ptr is not .IR "NULL" , then the call is equivalent to .IR "memkind_free(kind, ptr)" and .I NULL is returned. The address .IR "ptr" , if not .IR "NULL" , must have been returned by a previous call to .BR memkind_malloc (), .BR memkind_calloc (), .BR memkind_realloc (), .BR memkind_defrag_reallocate () or .BR memkind_posix_memalign () with the same .I kind as specified to the call to .BR memkind_realloc (). Otherwise, if .I memkind_free(kind, ptr) was called before, undefined behavior occurs. In cases where the kind is unknown in the context of the call to .BR memkind_realloc () .I NULL can be given as the .I kind specified to .BR memkind_realloc (), but this will require an internal look up for correct kind. .BR Note: The look up for .I kind could result in serious performance penalty, which can be avoided by specifying a correct .IR kind . If .I kind is .I NULL and .I ptr is .IR "NULL" , then .BR memkind_realloc () returns .I NULL and sets .I errno to .BR EINVAL . .PP .BR memkind_posix_memalign () allocates .I size bytes of memory of a specified .I kind such that the allocation's base address is an even multiple of .IR "alignment" , and returns the allocation in the value pointed to by .IR "memptr" . The requested .I alignment must be a power of 2 at least as large as .IR "sizeof(void*)" . If .I size is 0, then .BR memkind_posix_memalign () returns 0, with a .I NULL returned in .IR "memptr" . .PP .BR memkind_malloc_usable_size () function provides the same semantics as .BR malloc_usable_size (3), but operates on specified .IR "kind" . .br .BR Note: In cases where the kind is unknown in the context of the call to .BR memkind_malloc_usable_size () .I NULL can be given as the .I kind specified to .BR memkind_malloc_usable_size (), but this could require a internal look up for correct kind. .BR memkind_malloc_usable_size () is supported by TBB heap manager described in .B ENVIRONMENT section since Intel TBB 2019 Update 4. .PP .BR memkind_defrag_reallocate () reallocates the object conditionally inside specific .IR "kind" . Function determines if it's worthwhile to move allocation to reduce degree of external fragmentation of the heap. In case of failure function returns .IR "NULL" , otherwise function returns a pointer to reallocated memory and memory referenced by .I ptr was released and should not be accessed. If .I ptr is .IR "NULL" , then .BR memkind_defrag_reallocate () returns .IR "NULL" . In cases where the kind is unknown in the context of the call to .BR memkind_defrag_reallocate () .I NULL can be given as the .I kind specified to .BR memkind_defrag_reallocate (), but this will require an internal look up for correct kind. .BR Note: The look up for .I kind could result in serious performance penalty, which can be avoided by specifying a correct .IR kind . .PP .BR memkind_detect_kind () returns the kind associated with allocated memory referenced by .IR ptr . This pointer must have been returned by a previous call to .BR memkind_malloc (), .BR memkind_calloc (), .BR memkind_realloc (), .BR memkind_defrag_reallocate () or .BR memkind_posix_memalign (). If .I ptr is .IR "NULL" , then .BR memkind_detect_kind () returns .IR "NULL" . .BR Note: This function has non-trivial performance overhead. .PP .BR memkind_free () causes the allocated memory referenced by .I ptr to be made available for future allocations. This pointer must have been returned by a previous call to .BR memkind_malloc (), .BR memkind_calloc (), .BR memkind_realloc (), .BR memkind_defrag_reallocate () or .BR memkind_posix_memalign (). Otherwise, if .I memkind_free(kind, ptr) was already called before, undefined behavior occurs. If .I ptr is .IR "NULL" , no operation is performed. In cases where the kind is unknown in the context of the call to .BR memkind_free () .I NULL can be given as the .I kind specified to .BR memkind_free (), but this will require an internal look up for correct kind. .BR Note: The look up for .I kind could result in serious performance penalty, which can be avoided by specifying a correct .IR kind . .sp .B "KIND CONFIGURATION MANAGEMENT:" .br The functions described in this section define a way to create, delete and update kind specific configuration. Except of .BR memkind_config_new (), user must specify the memkind configuration with the first argument to each function. API described here is most useful with file-backed kind of memory, e.g. .BR memkind_create_pmem_with_config () method. .PP .BR memkind_config_new () creates the memkind configuration. .PP .BR memkind_config_delete () deletes previously created memkind configuration, which must have been returned by a previous call to .BR memkind_config_new (). .PP .BR memkind_config_set_path () updates the memkind .IR pmem_dir configuration parameter, which specifies directory path, where file-backed kind of memory will be created. .BR Note: This function does not validate that .I pmem_dir specifies a valid path. .PP .BR memkind_config_set_size () updates the memkind .IR pmem_size configuration parameter, which allows to limit the file-backed kind memory partition. .BR Note: This function does not validate that .I pmem_size is in valid range. .PP .BR memkind_config_set_memory_usage_policy () updates the memkind .IR policy configuration parameter, which allows to tune up memory utilization. The user should set the value based on the characteristics of application that is using the library (e.g. prioritize memory usage, CPU utilization), for more details about .IR policy see the .BR "MEMORY USAGE POLICY" section below. .BR Note: This function does not validate that .I policy is in valid range. .sp .B "KIND MANAGEMENT:" .br There are built-in kinds that are always available and these are enumerated in the .B KINDS section. The user can also create their own kinds of memory. This section describes the API's that enable the tracking of the different kinds of memory and determining their properties. .PP .BR memkind_create_fixed () is a function used to create a kind under user-specified area of memory. The memory can be allocated in any possible way, e.g. it might be a static array or an mmapped area. User can specify any properties using functions such as mbind. User is also responsible for de-allocation of memory after the kind destruction. The memory area must remain valid until fixed_kind is destroyed. The area starts at address .IR addr and has size .IR size. When heap manager runs out of memory (located under user-specified area), a call to .BR memkind_malloc () returns .IR "NULL" and .BR errno is set to .BR ENOMEM. .PP .BR memkind_create_pmem () is a convenient function used to create a file-backed kind of memory. It allocates a temporary file in the given directory .IR dir . The file is created in a fashion similar to .BR tmpfile (3), so that the file name does not appear when the directory is listed and the space is automatically freed when the program terminates. The file is truncated to a size of .I max_size bytes and the resulting space is memory-mapped. .br Note that the actual file system space is not allocated immediately, but only on a call to .BR memkind_pmem_mmap () (see .BR memkind_pmem (3)). This allows to create a pmem memkind of a pretty large size without the need to reserve in advance the corresponding file system space for the entire heap. If the value of .I max_size equals 0, pmem memkind is only limited by the capacity of the file system mounted under .I dir argument. The minimum .I max_size value which allows to limit the size of kind by the library is defined as .BR MEMKIND_PMEM_MIN_SIZE . Calling .BR memkind_create_pmem () with a size smaller than that and different than 0 will return an error. The maximum allowed size is not limited by .BR memkind , but by the file system specified by the .I dir argument. The .I max_size passed in is the raw size of the memory pool and .B jemalloc will use some of that space for its own metadata. Returns zero if the pmem memkind is created successfully or an error code from the .B ERRORS section if not. .PP .BR memkind_create_pmem_with_config () is a second function used to create a file-backed kind of memory. Function behaves simillar to .BR memkind_create_pmem () but instead of passing .I dir and .I max_size arguments, it uses .I config param to specify characteristics of created file-backed kind of memory (see .B KIND CONFIGURATION MANAGEMENT section). .PP .BR memkind_create_kind () creates kind that allocates memory with specific memory type, memory binding policy and flags (see .B MEMORY FLAGS section). The .IR memtype_flags (see .B MEMORY TYPES section) determine memory types to allocate, .IR policy argument is policy for specifying page binding to memory types selected by .IR memtype_flags . Returns zero if the specified kind is created successfully or an error code from the .B ERRORS section if not. .PP .BR memkind_destroy_kind () destroys previously created kind object, which must have been returned by a previous call to .BR memkind_create_pmem (), .BR memkind_create_pmem_with_config () or .BR memkind_create_kind (). Otherwise, or if .I memkind_destroy_kind(kind) was already called before, undefined behavior occurs. Note that, when the kind was returned by .BR memkind_create_kind () all allocated memory must be freed before kind is destroyed, otherwise this will cause memory leak. When the kind was returned by .BR memkind_create_pmem () or .BR memkind_create_pmem_with_config () all allocated memory will be freed after kind will be destroyed. .PP .BR memkind_check_available () returns zero if the specified .I kind is available or an error code from the .B ERRORS section if it is not. .PP .BR memkind_get_capacity () returns memory capacity of nodes available to a given .I kind (file size or filesystem capacity in case of a file-backed PMEM kind; total area size in the case of fixed-kind) or -1 in case of an error. Supported kinds are: .B MEMKIND_DEFAULT, MEMKIND_HIGHEST_CAPACITY, MEMKIND_HIGHEST_CAPACITY_LOCAL, MEMKIND_LOWEST_LATENCY_LOCAL, .B MEMKIND_HIGHEST_BANDWIDTH_LOCAL, MEMKIND_HUGETLB, MEMKIND_INTERLEAVE, MEMKIND_HBW, .B MEMKIND_HBW_ALL, MEMKIND_HBW_INTERLEAVE, MEMKIND_DAX_KMEM, MEMKIND_DAX_KMEM_ALL, .B MEMKIND_DAX_KMEM_INTERLEAVE, MEMKIND_REGULAR , file-backed PMEM and fixed-kind. .I kind. For .B MEMKIND_HUGETLB only pages with a default size of 2MB are supported. .PP .BR memkind_check_dax_path () returns zero if file-backed kind memory is in the specified directory path .I pmem_dir can be created with the DAX attribute or an error code from the .B ERRORS section if it is not. .PP .BR MEMKIND_PMEM_MIN_SIZE The minimum size which allows to limit the file-backed memory partition. .sp .B "STATISTICS:" .br The functions described in this section define a way to get specific memory allocation statistics. .PP .BR memkind_update_cached_stats () is used to force an update of cached dynamic allocator statistics. Statistics are not updated real-time by memkind library and this method allows to force its update. .PP .BR memkind_get_stat () retrieves statistic of the specified type and returns it in .IR "value". For more details about .I stat see the .B "MEMORY STATISTICS TYPE" section below. Measured statistic applies to specific .IR "kind", when .I NULL is given as .I kind then statistic applies to memory used by the whole memkind library. .BR Note: You need to call .BR memkind_update_cached_stats () before calling .BR memkind_get_stat () because statistics are cached by memkind library. .PP .BR memkind_stats_print () prints summary statistics. This function wraps jemalloc's function .BR je_malloc_stats_print (). Uses .I write_cb function to print the output. While providing custom writer function, use .BR syscall(2) rather than .BR write(2). Pass .IR NULL in order to use the default .I write_cb function which prints the output to the stderr. Use .I cbopaque parameter in order to pass some data to your .I write_cb function. Pass additional options using .IR "opts". For more details on .I opts see the .B "MEMORY STATISTICS PRINT OPTIONS" section below. Returns MEMKIND_ERROR_INVALID when failed to parse options string, MEMKIND_SUCCESS on success. .PP .sp .B "DECORATORS:" .br The memkind library enables the user to define decorator functions that can be called before and after each memkind heap management API. The decorators that are called at the beginning of the function end are named after that function with .I _pre appended to the name and those that are called at the end of the function are named after that function with .I _post appended to the name. These are weak symbols and if they are not present at link time they are not called. The memkind library does not define these symbols which are reserved for user definition. These decorators can be used to track calls to the heap management interface or to modify parameters. The decorators that are called at the beginning of the allocator pass all inputs by reference and the decorators that are called at the end of the allocator pass the output by reference. This enables the modification of the input and output of each heap management function by the decorators. .sp .B "ENHANCEMENTS:" .br .BR memkind_set_bg_threads() enables/disables internal background worker threads in jemalloc. .sp .B "LIBRARY VERSION:" .br The memkind library version scheme consist major, minor and patch numbers separated by dot. Combining those numbers, we got the following representation: .br major.minor.patch, where: .br -major number is incremented whenever API is changed (loss of backward compatibility), .br -minor number is incremented whenever additional extensions are introduced or behavior has been changed, .br -patch number is incremented whenever small bug fixes are added. .sp memkind library provide numeric representation of the version by exposing the following API: .PP .BR memkind_get_version () returns version number represented by a single integer number, obtained from the formula: .br major * 1000000 + minor * 1000 + patch .sp .BR Note: major < 1 means unstable API. .sp API standards: .br -STANDARD API, API is considered as stable .br -NON-STANDARD API, API is considered as stable, however this is not a standard way to use memkind .br -EXPERIMENTAL API, API is considered as unstable and the subject to change .br .sp .SH "RETURN VALUE" .BR memkind_calloc (), .BR memkind_malloc (), .BR memkind_realloc () and .BR memkind_defrag_reallocate () returns the pointer to the allocated memory or .I NULL if the request fails. .BR memkind_malloc_usable_size () returns the number of usable bytes in the block of allocated memory pointed to by .IR "ptr" , a pointer to a block of memory allocated by .BR memkind_malloc () or a related function. If .I ptr is .IR "NULL" , 0 is returned. .BR memkind_free () and .BR memkind_error_message () do not have return values. All other memkind API's return 0 upon success and an error code defined in the .B ERRORS section upon failure. The memkind library avoids setting .I errno directly, but calls to underlying libraries and system calls may set .IR errno (e.g. .BR memkind_create_pmem ()). .SH "KINDS" The available kinds of memory: .TP .B MEMKIND_DEFAULT Default allocation using standard memory and default page size. .TP .B MEMKIND_HIGHEST_CAPACITY Allocate from a NUMA node(s) that has the highest capacity among all nodes in the system. .TP .B MEMKIND_HIGHEST_CAPACITY_PREFERRED Same as .B MEMKIND_HIGHEST_CAPACITY except that if there is not enough memory in the NUMA node that has the highest capacity in the local domain to satisfy the request, the allocation will fall back on other memory NUMA nodes. .BR Note: For this kind, the allocation will not succeed if there are two or more NUMA nodes that have the highest capacity. .TP .B MEMKIND_HIGHEST_CAPACITY_LOCAL Allocate from a NUMA node that has the highest capacity among all NUMA Nodes from the local domain. NUMA Nodes have the same local domain for a set of CPUs associated with them, e.g. socket or sub-NUMA cluster. .BR Note: If there are multiple NUMA nodes in the same local domain that have the highest capacity - allocation will be done from NUMA node with worse latency attribute. This kind requires locality information described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HIGHEST_CAPACITY_LOCAL_PREFERRED Same as .B MEMKIND_HIGHEST_CAPACITY_LOCAL except that if there is not enough memory in the NUMA node that has the highest capacity to satisfy the request, the allocation will fall back on other memory NUMA nodes. .TP .B MEMKIND_LOWEST_LATENCY_LOCAL Allocate from a NUMA node that has the lowest latency among all NUMA Nodes from the local domain. NUMA Nodes have the same local domain for a set of CPUs associated with them, e.g. socket or sub-NUMA cluster. .BR Note: If there are multiple NUMA nodes in the same local domain that have the lowest latency - allocation will be done from NUMA node with smaller memory capacity. This kind requires locality and memory performance characteristics information described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_LOWEST_LATENCY_LOCAL_PREFERRED Same as .B MEMKIND_LOWEST_LATENCY_LOCAL except that if there is not enough memory in the NUMA node that has the lowest latency to satisfy the request, the allocation will fall back on other memory NUMA nodes. .TP .B MEMKIND_HIGHEST_BANDWIDTH_LOCAL Allocate from a NUMA node that has the highest bandwidth among all NUMA Nodes from the local domain. NUMA Nodes have the same local domain for a set of CPUs associated with them, e.g. socket or sub-NUMA cluster. .BR Note: If there are multiple NUMA nodes in the same local domain that have the highest bandwidth - allocation will be done from NUMA node with smaller memory capacity. This kind requires locality and memory performance characteristics information described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HIGHEST_BANDWIDTH_LOCAL_PREFERRED Same as .B MEMKIND_HIGHEST_BANDWIDTH_LOCAL except that if there is not enough memory in the NUMA node that has the highest bandwidth to satisfy the request, the allocation will fall back on other memory NUMA nodes. .TP .B MEMKIND_HUGETLB Allocate from standard memory using huge pages. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_GBTLB (DEPRECATED) Allocate from standard memory using 1GB chunks backed by huge pages. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_INTERLEAVE Allocate pages interleaved across all NUMA nodes with transparent huge pages disabled. .TP .B MEMKIND_HBW Allocate from the closest high bandwidth memory NUMA node(s) at the time of allocation. If there is not enough high bandwidth memory to satisfy the request .I errno is set to .B ENOMEM and the allocated pointer is set to .IR "NULL" . .BR Note: This kind requires memory performance characteristics information described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HBW_ALL Same as .B MEMKIND_HBW except decision regarding closest NUMA node(s) is postponed until the time of first write. .TP .B MEMKIND_HBW_HUGETLB Same as .B MEMKIND_HBW except the allocation is backed by huge pages. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HBW_ALL_HUGETLB Combination of .B MEMKIND_HBW_ALL and .B MEMKIND_HBW_HUGETLB properties. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HBW_PREFERRED Same as .B MEMKIND_HBW except that if there is not enough high bandwidth memory to satisfy the request, the allocation will fall back on standard memory. .BR Note: For this kind, the allocation will not succeed if two or more high bandwidth memory NUMA nodes are in the same shortest distance to the same CPU on which process is eligible to run. Check on that eligibility is done upon starting the application. .TP .B MEMKIND_HBW_PREFERRED_HUGETLB Same as .B MEMKIND_HBW_PREFERRED except the allocation is backed by huge pages. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HBW_GBTLB (DEPRECATED) Same as .B MEMKIND_HBW except the allocation is backed by 1GB chunks of huge pages. Note that .I size can take on any value, but full gigabyte pages will allocated for each request, so remainder of the last page will be wasted. This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. .TP .B MEMKIND_HBW_PREFERRED_GBTLB (DEPRECATED) Same as .B MEMKIND_HBW_GBTLB except that if there is not enough high bandwidth memory to satisfy the request, the allocation will fall back on standard memory. .BR Note: This kind requires huge pages configuration described in .B SYSTEM CONFIGURATION section. For this kind, the allocation will not succeed if two or more high bandwidth memory NUMA nodes are in the same shortest distance to the same CPU on which process is eligible to run. Check on that eligibility is done upon starting the application. .TP .B MEMKIND_HBW_INTERLEAVE Same as .B MEMKIND_HBW except that the pages that support the allocation are interleaved across all high bandwidth nodes and transparent huge pages are disabled. .TP .B MEMKIND_DAX_KMEM Allocate from the closest persistent memory NUMA node at the time of allocation. If there is not enough memory in the closest persistent memory NUMA node to satisfy the request .I errno is set to .B ENOMEM and the allocated pointer is set to .IR "NULL" . .TP .B MEMKIND_DAX_KMEM_ALL Allocate from the closest persistent memory NUMA node available at the time of allocation. If there is not enough memory on any of persistent memory NUMA nodes to satisfy the request .I errno is set to .B ENOMEM and the allocated pointer is set to .IR "NULL" . .TP .B MEMKIND_DAX_KMEM_PREFERRED Same as .B MEMKIND_DAX_KMEM except that if there is not enough memory in the closest persistent memory NUMA node to satisfy the request, the allocation will fall back on other memory NUMA nodes. .BR Note: For this kind, the allocation will not succeed if two or more persistent memory NUMA nodes are in the same shortest distance to the same CPU on which process is eligible to run. Check on that eligibility is done upon starting the application. .TP .B MEMKIND_DAX_KMEM_INTERLEAVE Same as .B MEMKIND_DAX_KMEM except that the pages that support the allocation are interleaved across all persistent memory NUMA nodes. .TP .B MEMKIND_REGULAR Allocate from regular memory using the default page size. Regular means general purpose memory from the NUMA nodes containing CPUs. .SH "MEMORY TYPES" The available types of memory: .TP .B MEMKIND_MEMTYPE_DEFAULT Standard memory, the same as process uses. .TP .B MEMKIND_MEMTYPE_HIGH_BANDWIDTH High bandwidth memory (HBM). There must be at least two memory types with different bandwidth to determine which is the HBM. .SH "MEMORY BINDING POLICY" The available types of memory binding policy: .TP .B MEMKIND_POLICY_BIND_LOCAL Allocate local memory. If there is not enough memory to satisfy the request .I errno is set to .BR ENOMEM and the allocated pointer is set to .IR "NULL" . .TP .B MEMKIND_POLICY_BIND_ALL Memory locality is ignored. If there is not enough memory to satisfy the request .I errno is set to .B ENOMEM and the allocated pointer is set to .IR "NULL" . .TP .B MEMKIND_POLICY_PREFERRED_LOCAL Allocate preferred memory that is local. If there is not enough preferred memory to satisfy the request or preferred memory is not available, the allocation will fall back on any other memory. .TP .B MEMKIND_POLICY_INTERLEAVE_LOCAL Interleave allocation across local memory. For n memory types the allocation will be interleaved across all of them. .TP .B MEMKIND_POLICY_INTERLEAVE_ALL Interleave allocation. Locality is ignored. For n memory types the allocation will be interleaved across all of them. .TP .B MEMKIND_POLICY_MAX_VALUE Max policy value. .SH "MEMORY FLAGS" The available types of memory flags: .TP .B MEMKIND_MASK_PAGE_SIZE_2MB Allocation backed by 2MB page size. .SH "MEMORY USAGE POLICY" The available types of memory usage policy: .TP .B MEMKIND_MEM_USAGE_POLICY_DEFAULT Default memory usage policy. .TP .B MEMKIND_MEM_USAGE_POLICY_CONSERVATIVE Conservative memory usage policy - prioritize memory usage at cost of performance. .BR Note: Memory usage policies have no effect for TBB heap manager described in .B ENVIRONMENT section. .SH "MEMORY STATISTICS TYPE" The available types of memory statistics: .TP .B MEMKIND_STAT_TYPE_RESIDENT Maximum number of bytes in physically resident data pages mapped. .TP .B MEMKIND_STAT_TYPE_ACTIVE Total number of bytes in active pages. .TP .B MEMKIND_STAT_TYPE_ALLOCATED Total number of allocated bytes. .SH "MEMORY STATISTICS PRINT OPTIONS" The available options for printing statistics: .TP .B MEMKIND_STAT_PRINT_ALL Print all statistics. .TP .B MEMKIND_STAT_PRINT_JSON_FORMAT Print statistics in JSON format. .TP .B MEMKIND_STAT_PRINT_OMIT_GENERAL Omit general information that never changes during execution. .TP .B MEMKIND_STAT_PRINT_OMIT_MERGED_ARENA Omit merged arena statistics. .TP .B MEMKIND_STAT_PRINT_OMIT_DESTROYED_MERGED_ARENA Omit destroyed merged arena statistics. .TP .B MEMKIND_STAT_PRINT_OMIT_PER_ARENA Omit per arena statistics. .TP .B MEMKIND_STAT_PRINT_OMIT_PER_SIZE_CLASS_BINS Omit per size class statistics for bins. .TP .B MEMKIND_STAT_PRINT_OMIT_PER_SIZE_CLASS_LARGE Omit per size class statistics for large objects. .TP .B MEMKIND_STAT_PRINT_OMIT_MUTEX Omit all mutex statistics. .TP .B MEMKIND_STAT_PRINT_OMIT_EXTENT Omit extent statistics. .SH "ERRORS" .TP .BR memkind_posix_memalign () returns the one of the POSIX standard error codes .B EINVAL or .B ENOMEM as defined in .I if an error occurs (these have positive values). If the .I alignment parameter is not a power of two or is not a multiple of .IR "sizeof(void*)" , then .B EINVAL is returned. If there is insufficient memory to satisfy the request then .B ENOMEM is returned. .PP All functions other than .BR memkind_posix_memalign () which have an integer return type return one of the negative error codes as defined in .I and described below. .TP .B MEMKIND_ERROR_UNAVAILABLE Requested memory kind is not available .TP .B MEMKIND_ERROR_MBIND Call to .BR mbind (2) failed .TP .B MEMKIND_ERROR_MMAP Call to .BR mmap (2) failed .TP .B MEMKIND_ERROR_MALLOC Call to jemalloc's .BR malloc () failed .TP .B MEMKIND_ERROR_ENVIRON Error parsing environment variable .I MEMKIND_* .TP .B MEMKIND_ERROR_INVALID Invalid input arguments to memkind routine .TP .B MEMKIND_ERROR_TOOMANY Error trying to initialize more than maximum .B MEMKIND_MAX_KIND number of kinds .TP .B MEMKIND_ERROR_BADOPS Error memkind operation structure is missing or invalid .TP .B MEMKIND_ERROR_HUGETLB Unable to allocate huge pages .TP .B MEMKIND_ERROR_MEMTYPE_NOT_AVAILABLE Error requested memory type is not available .TP .B MEMKIND_ERROR_OPERATION_FAILED Error memkind operation failed .TP .B MEMKIND_ERROR_ARENAS_CREATE Call to jemalloc's .BR arenas.create () failed .TP .B MEMKIND_ERROR_RUNTIME Unspecified run-time error .SH "FILES" .TP .I /usr/bin/memkind-hbw-nodes Prints a comma-separated list of high bandwidth nodes. .TP .I /usr/bin/memkind-auto-dax-kmem-nodes Prints a comma-separated list of persistent memory NUMA nodes, which are automatically detected. .SH "ENVIRONMENT" .TP .B MEMKIND_HBW_NODES This environment variable is a comma-separated list of NUMA nodes that are treated as high bandwidth. Uses the .I libnuma routine .BR numa_parse_nodestring () for parsing, so the syntax described in the .BR numa (3) man page for this routine applies: e.g. 1-3,5 is a valid setting. .TP .B MEMKIND_HBW_THRESHOLD This environment variable is bandwidth in MB/s that is the threshold for identifying high bandwidth memory. The default threshold is 204800 (200 GB/s), which is used if this variable is not set. When set, it must be greater than or equal to 0. .TP .B MEMKIND_DAX_KMEM_NODES This environment variable is a comma-separated list of NUMA nodes that are treated as PMEM memory. Uses the .I libnuma routine .BR numa_parse_nodestring () for parsing, so the syntax described in the .BR numa (3) man page for this routine applies: e.g. 1-3,5 is a valid setting. .TP .B MEMKIND_ARENA_NUM_PER_KIND This environment variable allows leveraging internal mechanism of the library for setting number of arenas per kind. Value should be a positive integer (not greater than .B INT_MAX defined in .IR ). The user should set the value based on the characteristics of application that is using the library. Higher value can provide better performance in extremely multithreaded applications at the cost of memory overhead. See section .BR "IMPLEMENTATION NOTES" of .BR jemalloc (3) for more details about arenas. .TP .B MEMKIND_HOG_MEMORY Controls behavior of memkind with regards to returning memory to underlying OS. Setting .B MEMKIND_HOG_MEMORY to 1 causes memkind to not release memory to OS in anticipation of memory reuse soon. This will improve latency of 'free' operations but increase memory usage. .BR Note: For file-backed kind memory will be released to OS only after calling .BR memkind_destroy_kind(), not after 'free' operations. In context of .B MEMKIND_MEM_USAGE_POLICY_CONSERVATIVE memory usage policy - it will also impact memory coalescing and results that blocks pages will be often reused (better memory usage at cost of performance). .TP .B MEMKIND_DEBUG Controls logging mechanism in memkind. Setting .B MEMKIND_DEBUG to 1 enables printing messages like errors and general information about environment to .IR stderr . .TP .B MEMKIND_BACKGROUND_THREAD_LIMIT Enable background worker threads. Value should be from range 0 to maximum number of cpus. Setting .B MEMKIND_BACKGROUND_THREAD_LIMIT to specific value will limit maximum number of background worker threads to this value. 0 means maximum number of background worker threads will be limited to maximum number of cpus. .TP .B MEMKIND_HEAP_MANAGER Controls heap management behavior in memkind library by switching to one of the available heap managers. .br Values: .br JEMALLOC - sets the jemalloc heap manager .br TBB - sets the Intel Threading Building Blocks heap manager. This option requires installed Intel Threading Building Blocks library. .PP If the .B MEMKIND_HEAP_MANAGER is not set then the jemalloc heap manager will be used by default. .SH "SYSTEM CONFIGURATION" Interfaces for obtaining 2MB (HUGETLB) memory need allocated huge pages in the kernel's huge page pool. .TP .B HUGETLB (huge pages) Current number of "persistent" huge pages can be read from .I /proc/sys/vm/nr_hugepages file. Proposed way of setting hugepages is: .BR "sudo sysctl vm.nr_hugepages=" . More information can be found here: .UR https://www.kernel.org/doc/Documentation/vm/hugetlbpage.txt .UE .PP Interfaces for obtaining locality information are provided by .I libhwloc dependency. Functionality based on locality requires that memkind library is configured and built with the support of .I libhwloc (./configure --enable-hwloc). .PP Interfaces for obtaining memory performance characteristics information are based on .I HMAT (Heterogeneous Memory Attribute Table) .UR https://uefi.org/sites/default/files/resources/ACPI_6_3_final_Jan30.pdf .UE Functionality based on memory performance characteristics requires that platform configuration fully supports HMAT and memkind library is configured and built with the support of .I libhwloc (./configure --enable-hwloc). .PP .BR Note: For a given target NUMA Node, the OS exposes only the performance characteristics of the best performing NUMA node. .PP .I libhwloc can be reached on: .UR https://www.open-mpi.org/projects/hwloc .UE .SH "STATIC LINKING" When linking statically against memkind, .I libmemkind.a should be used together with its dependencies .I libnuma and pthread. Pthread can be linked by adding .I /usr/lib64/libpthread.a as a dependency (exact path may vary). Typically .I libnuma will need to be compiled from sources to use it as a static dependency. .I libnuma can be reached on GitHub: .UR https://github.com/numactl/numactl .UE .SH "KNOWN ISSUES" .TP .B HUGETLB (huge pages) There might be some overhead in huge pages consumption caused by heap management. If your allocation fails because of OOM, please try to allocate extra huge pages (e.g. 8 huge pages). .SH "COPYRIGHT" Copyright (C) 2014 - 2021 Intel Corporation. All rights reserved. .SH "SEE ALSO" .BR malloc (3), .BR malloc_usable_size (3), .BR numa (3), .BR hwloc (3), .BR numactl (8), .BR mbind (2), .BR mmap (2), .BR move_pages (2), .BR jemalloc (3), .BR memkind_dax_kmem (3), .BR memkind_default (3), .BR memkind_arena (3), .BR memkind_fixed (3), .BR memkind_hbw (3), .BR memkind_hugetlb (3), .BR memkind_pmem (3), .BR syscall(2), .BR write(2)