2005-06-22 07:15:02 +07:00
|
|
|
/*
|
2011-07-13 12:14:24 +07:00
|
|
|
* Basic general purpose allocator for managing special purpose
|
|
|
|
* memory, for example, memory that is not managed by the regular
|
|
|
|
* kmalloc/kfree interface. Uses for this includes on-device special
|
|
|
|
* memory, uncached memory etc.
|
|
|
|
*
|
|
|
|
* It is safe to use the allocator in NMI handlers and other special
|
|
|
|
* unblockable contexts that could otherwise deadlock on locks. This
|
|
|
|
* is implemented by using atomic operations and retries on any
|
|
|
|
* conflicts. The disadvantage is that there may be livelocks in
|
|
|
|
* extreme cases. For better scalability, one allocator can be used
|
|
|
|
* for each CPU.
|
|
|
|
*
|
|
|
|
* The lockless operation only works if there is enough memory
|
|
|
|
* available. If new memory is added to the pool a lock has to be
|
|
|
|
* still taken. So any user relying on locklessness has to ensure
|
|
|
|
* that sufficient memory is preallocated.
|
|
|
|
*
|
|
|
|
* The basic atomic operation of this allocator is cmpxchg on long.
|
|
|
|
* On architectures that don't have NMI-safe cmpxchg implementation,
|
|
|
|
* the allocator can NOT be used in NMI handler. So code uses the
|
|
|
|
* allocator in NMI handler should depend on
|
|
|
|
* CONFIG_ARCH_HAVE_NMI_SAFE_CMPXCHG.
|
2005-06-22 07:15:02 +07:00
|
|
|
*
|
|
|
|
* This source code is licensed under the GNU General Public License,
|
|
|
|
* Version 2. See the file COPYING for more details.
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
2011-05-25 07:13:33 +07:00
|
|
|
#ifndef __GENALLOC_H__
|
|
|
|
#define __GENALLOC_H__
|
2013-04-30 06:17:10 +07:00
|
|
|
|
2014-01-24 06:53:18 +07:00
|
|
|
#include <linux/spinlock_types.h>
|
|
|
|
|
2013-04-30 06:17:10 +07:00
|
|
|
struct device;
|
|
|
|
struct device_node;
|
|
|
|
|
genalloc: make it possible to use a custom allocation algorithm
Premit use of another algorithm than the default first-fit one. For
example a custom algorithm could be used to manage alignment requirements.
As I can't predict all the possible requirements/needs for all allocation
uses cases, I add a "free" field 'void *data' to pass any needed
information to the allocation function. For example 'data' could be used
to handle a structure where you store the alignment, the expected memory
bank, the requester device, or any information that could influence the
allocation algorithm.
An usage example may look like this:
struct my_pool_constraints {
int align;
int bank;
...
};
unsigned long my_custom_algo(unsigned long *map, unsigned long size,
unsigned long start, unsigned int nr, void *data)
{
struct my_pool_constraints *constraints = data;
...
deal with allocation contraints
...
return the index in bitmap where perform the allocation
}
void create_my_pool()
{
struct my_pool_constraints c;
struct gen_pool *pool = gen_pool_create(...);
gen_pool_add(pool, ...);
gen_pool_set_algo(pool, my_custom_algo, &c);
}
Add of best-fit algorithm function:
most of the time best-fit is slower then first-fit but memory fragmentation
is lower. The random buffer allocation/free tests don't show any arithmetic
relation between the allocation time and fragmentation but the
best-fit algorithm
is sometime able to perform the allocation when the first-fit can't.
This new algorithm help to remove static allocations on ESRAM, a small but
fast on-chip RAM of few KB, used for high-performance uses cases like DMA
linked lists, graphic accelerators, encoders/decoders. On the Ux500
(in the ARM tree) we have define 5 ESRAM banks of 128 KB each and use of
static allocations becomes unmaintainable:
cd arch/arm/mach-ux500 && grep -r ESRAM .
./include/mach/db8500-regs.h:/* Base address and bank offsets for ESRAM */
./include/mach/db8500-regs.h:#define U8500_ESRAM_BASE 0x40000000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK_SIZE 0x00020000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK0 U8500_ESRAM_BASE
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK1 (U8500_ESRAM_BASE + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK2 (U8500_ESRAM_BANK1 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK3 (U8500_ESRAM_BANK2 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK4 (U8500_ESRAM_BANK3 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_DMA_LCPA_OFFSET 0x10000
./include/mach/db8500-regs.h:#define U8500_DMA_LCPA_BASE
(U8500_ESRAM_BANK0 + U8500_ESRAM_DMA_LCPA_OFFSET)
./include/mach/db8500-regs.h:#define U8500_DMA_LCLA_BASE U8500_ESRAM_BANK4
I want to use genalloc to do dynamic allocations but I need to be able to
fine tune the allocation algorithm. I my case best-fit algorithm give
better results than first-fit, but it will not be true for every use case.
Signed-off-by: Benjamin Gaignard <benjamin.gaignard@stericsson.com>
Cc: Huang Ying <ying.huang@intel.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2012-10-05 07:13:20 +07:00
|
|
|
/**
|
|
|
|
* Allocation callback function type definition
|
|
|
|
* @map: Pointer to bitmap
|
|
|
|
* @size: The bitmap size in bits
|
|
|
|
* @start: The bitnumber to start searching at
|
|
|
|
* @nr: The number of zeroed bits we're looking for
|
|
|
|
* @data: optional additional data used by @genpool_algo_t
|
|
|
|
*/
|
|
|
|
typedef unsigned long (*genpool_algo_t)(unsigned long *map,
|
|
|
|
unsigned long size,
|
|
|
|
unsigned long start,
|
|
|
|
unsigned int nr,
|
|
|
|
void *data);
|
|
|
|
|
2005-06-22 07:15:02 +07:00
|
|
|
/*
|
2006-06-23 16:03:21 +07:00
|
|
|
* General purpose special memory pool descriptor.
|
2005-06-22 07:15:02 +07:00
|
|
|
*/
|
2006-06-23 16:03:21 +07:00
|
|
|
struct gen_pool {
|
2011-07-13 12:14:24 +07:00
|
|
|
spinlock_t lock;
|
2006-06-23 16:03:21 +07:00
|
|
|
struct list_head chunks; /* list of chunks in this pool */
|
|
|
|
int min_alloc_order; /* minimum allocation order */
|
genalloc: make it possible to use a custom allocation algorithm
Premit use of another algorithm than the default first-fit one. For
example a custom algorithm could be used to manage alignment requirements.
As I can't predict all the possible requirements/needs for all allocation
uses cases, I add a "free" field 'void *data' to pass any needed
information to the allocation function. For example 'data' could be used
to handle a structure where you store the alignment, the expected memory
bank, the requester device, or any information that could influence the
allocation algorithm.
An usage example may look like this:
struct my_pool_constraints {
int align;
int bank;
...
};
unsigned long my_custom_algo(unsigned long *map, unsigned long size,
unsigned long start, unsigned int nr, void *data)
{
struct my_pool_constraints *constraints = data;
...
deal with allocation contraints
...
return the index in bitmap where perform the allocation
}
void create_my_pool()
{
struct my_pool_constraints c;
struct gen_pool *pool = gen_pool_create(...);
gen_pool_add(pool, ...);
gen_pool_set_algo(pool, my_custom_algo, &c);
}
Add of best-fit algorithm function:
most of the time best-fit is slower then first-fit but memory fragmentation
is lower. The random buffer allocation/free tests don't show any arithmetic
relation between the allocation time and fragmentation but the
best-fit algorithm
is sometime able to perform the allocation when the first-fit can't.
This new algorithm help to remove static allocations on ESRAM, a small but
fast on-chip RAM of few KB, used for high-performance uses cases like DMA
linked lists, graphic accelerators, encoders/decoders. On the Ux500
(in the ARM tree) we have define 5 ESRAM banks of 128 KB each and use of
static allocations becomes unmaintainable:
cd arch/arm/mach-ux500 && grep -r ESRAM .
./include/mach/db8500-regs.h:/* Base address and bank offsets for ESRAM */
./include/mach/db8500-regs.h:#define U8500_ESRAM_BASE 0x40000000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK_SIZE 0x00020000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK0 U8500_ESRAM_BASE
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK1 (U8500_ESRAM_BASE + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK2 (U8500_ESRAM_BANK1 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK3 (U8500_ESRAM_BANK2 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK4 (U8500_ESRAM_BANK3 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_DMA_LCPA_OFFSET 0x10000
./include/mach/db8500-regs.h:#define U8500_DMA_LCPA_BASE
(U8500_ESRAM_BANK0 + U8500_ESRAM_DMA_LCPA_OFFSET)
./include/mach/db8500-regs.h:#define U8500_DMA_LCLA_BASE U8500_ESRAM_BANK4
I want to use genalloc to do dynamic allocations but I need to be able to
fine tune the allocation algorithm. I my case best-fit algorithm give
better results than first-fit, but it will not be true for every use case.
Signed-off-by: Benjamin Gaignard <benjamin.gaignard@stericsson.com>
Cc: Huang Ying <ying.huang@intel.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2012-10-05 07:13:20 +07:00
|
|
|
|
|
|
|
genpool_algo_t algo; /* allocation function */
|
|
|
|
void *data;
|
2005-06-22 07:15:02 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
2006-06-23 16:03:21 +07:00
|
|
|
* General purpose special memory pool chunk descriptor.
|
2005-06-22 07:15:02 +07:00
|
|
|
*/
|
2006-06-23 16:03:21 +07:00
|
|
|
struct gen_pool_chunk {
|
|
|
|
struct list_head next_chunk; /* next chunk in pool */
|
2011-07-13 12:14:24 +07:00
|
|
|
atomic_t avail;
|
2011-05-25 07:13:34 +07:00
|
|
|
phys_addr_t phys_addr; /* physical starting address of memory chunk */
|
2013-09-12 04:21:43 +07:00
|
|
|
unsigned long start_addr; /* start address of memory chunk */
|
|
|
|
unsigned long end_addr; /* end address of memory chunk (inclusive) */
|
2006-06-23 16:03:21 +07:00
|
|
|
unsigned long bits[0]; /* bitmap for allocating memory chunk */
|
2005-06-22 07:15:02 +07:00
|
|
|
};
|
|
|
|
|
2006-06-23 16:03:21 +07:00
|
|
|
extern struct gen_pool *gen_pool_create(int, int);
|
2011-05-25 07:13:34 +07:00
|
|
|
extern phys_addr_t gen_pool_virt_to_phys(struct gen_pool *pool, unsigned long);
|
|
|
|
extern int gen_pool_add_virt(struct gen_pool *, unsigned long, phys_addr_t,
|
|
|
|
size_t, int);
|
|
|
|
/**
|
|
|
|
* gen_pool_add - add a new chunk of special memory to the pool
|
|
|
|
* @pool: pool to add new memory chunk to
|
|
|
|
* @addr: starting address of memory chunk to add to pool
|
|
|
|
* @size: size in bytes of the memory chunk to add to pool
|
|
|
|
* @nid: node id of the node the chunk structure and bitmap should be
|
|
|
|
* allocated on, or -1
|
|
|
|
*
|
|
|
|
* Add a new chunk of special memory to the specified pool.
|
|
|
|
*
|
|
|
|
* Returns 0 on success or a -ve errno on failure.
|
|
|
|
*/
|
|
|
|
static inline int gen_pool_add(struct gen_pool *pool, unsigned long addr,
|
|
|
|
size_t size, int nid)
|
|
|
|
{
|
|
|
|
return gen_pool_add_virt(pool, addr, -1, size, nid);
|
|
|
|
}
|
2006-10-02 16:17:00 +07:00
|
|
|
extern void gen_pool_destroy(struct gen_pool *);
|
2006-06-23 16:03:21 +07:00
|
|
|
extern unsigned long gen_pool_alloc(struct gen_pool *, size_t);
|
2013-11-13 06:09:52 +07:00
|
|
|
extern void *gen_pool_dma_alloc(struct gen_pool *pool, size_t size,
|
|
|
|
dma_addr_t *dma);
|
2006-06-23 16:03:21 +07:00
|
|
|
extern void gen_pool_free(struct gen_pool *, unsigned long, size_t);
|
2011-07-13 12:14:24 +07:00
|
|
|
extern void gen_pool_for_each_chunk(struct gen_pool *,
|
|
|
|
void (*)(struct gen_pool *, struct gen_pool_chunk *, void *), void *);
|
|
|
|
extern size_t gen_pool_avail(struct gen_pool *);
|
|
|
|
extern size_t gen_pool_size(struct gen_pool *);
|
genalloc: make it possible to use a custom allocation algorithm
Premit use of another algorithm than the default first-fit one. For
example a custom algorithm could be used to manage alignment requirements.
As I can't predict all the possible requirements/needs for all allocation
uses cases, I add a "free" field 'void *data' to pass any needed
information to the allocation function. For example 'data' could be used
to handle a structure where you store the alignment, the expected memory
bank, the requester device, or any information that could influence the
allocation algorithm.
An usage example may look like this:
struct my_pool_constraints {
int align;
int bank;
...
};
unsigned long my_custom_algo(unsigned long *map, unsigned long size,
unsigned long start, unsigned int nr, void *data)
{
struct my_pool_constraints *constraints = data;
...
deal with allocation contraints
...
return the index in bitmap where perform the allocation
}
void create_my_pool()
{
struct my_pool_constraints c;
struct gen_pool *pool = gen_pool_create(...);
gen_pool_add(pool, ...);
gen_pool_set_algo(pool, my_custom_algo, &c);
}
Add of best-fit algorithm function:
most of the time best-fit is slower then first-fit but memory fragmentation
is lower. The random buffer allocation/free tests don't show any arithmetic
relation between the allocation time and fragmentation but the
best-fit algorithm
is sometime able to perform the allocation when the first-fit can't.
This new algorithm help to remove static allocations on ESRAM, a small but
fast on-chip RAM of few KB, used for high-performance uses cases like DMA
linked lists, graphic accelerators, encoders/decoders. On the Ux500
(in the ARM tree) we have define 5 ESRAM banks of 128 KB each and use of
static allocations becomes unmaintainable:
cd arch/arm/mach-ux500 && grep -r ESRAM .
./include/mach/db8500-regs.h:/* Base address and bank offsets for ESRAM */
./include/mach/db8500-regs.h:#define U8500_ESRAM_BASE 0x40000000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK_SIZE 0x00020000
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK0 U8500_ESRAM_BASE
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK1 (U8500_ESRAM_BASE + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK2 (U8500_ESRAM_BANK1 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK3 (U8500_ESRAM_BANK2 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_BANK4 (U8500_ESRAM_BANK3 + U8500_ESRAM_BANK_SIZE)
./include/mach/db8500-regs.h:#define U8500_ESRAM_DMA_LCPA_OFFSET 0x10000
./include/mach/db8500-regs.h:#define U8500_DMA_LCPA_BASE
(U8500_ESRAM_BANK0 + U8500_ESRAM_DMA_LCPA_OFFSET)
./include/mach/db8500-regs.h:#define U8500_DMA_LCLA_BASE U8500_ESRAM_BANK4
I want to use genalloc to do dynamic allocations but I need to be able to
fine tune the allocation algorithm. I my case best-fit algorithm give
better results than first-fit, but it will not be true for every use case.
Signed-off-by: Benjamin Gaignard <benjamin.gaignard@stericsson.com>
Cc: Huang Ying <ying.huang@intel.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2012-10-05 07:13:20 +07:00
|
|
|
|
|
|
|
extern void gen_pool_set_algo(struct gen_pool *pool, genpool_algo_t algo,
|
|
|
|
void *data);
|
|
|
|
|
|
|
|
extern unsigned long gen_pool_first_fit(unsigned long *map, unsigned long size,
|
|
|
|
unsigned long start, unsigned int nr, void *data);
|
|
|
|
|
|
|
|
extern unsigned long gen_pool_best_fit(unsigned long *map, unsigned long size,
|
|
|
|
unsigned long start, unsigned int nr, void *data);
|
|
|
|
|
2013-04-30 06:17:10 +07:00
|
|
|
extern struct gen_pool *devm_gen_pool_create(struct device *dev,
|
|
|
|
int min_alloc_order, int nid);
|
|
|
|
extern struct gen_pool *dev_get_gen_pool(struct device *dev);
|
|
|
|
|
|
|
|
#ifdef CONFIG_OF
|
|
|
|
extern struct gen_pool *of_get_named_gen_pool(struct device_node *np,
|
|
|
|
const char *propname, int index);
|
|
|
|
#else
|
|
|
|
static inline struct gen_pool *of_get_named_gen_pool(struct device_node *np,
|
|
|
|
const char *propname, int index)
|
|
|
|
{
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
#endif
|
2011-05-25 07:13:33 +07:00
|
|
|
#endif /* __GENALLOC_H__ */
|