mm: generic adaptive large memory allocation APIs [Kernel]

Prev: Your Webmail Quota Has Exceeded The Set Quota Please Upgrade
Next: staging: hv: Add Time Sync feature to hv_utils module

From: Changli Gao on 5 May 2010 20:40

On Thu, May 6, 2010 at 8:30 AM, Changli Gao <xiaosuo(a)gmail.com> wrote:
> kvmalloc() will try to allocate physically contiguous memory first, and try
> vmalloc to allocate virtually contiguous memory when the former allocation
> fails.
>
> kvfree() is used to free the memory allocated by kvmalloc(). It can't be used
> in atomic context. If the callers are in atomic context, they can use
> kvfree_inatomic() instead.
>
> There is a lot of duplicated code in the kernel that does this, so I have
> created the above APIs.
>
> Thanks to Eric Dumazet for the "kv" prefix. :)
>
> #include <linux/kernel.h>
> #include <linux/module.h>
> #include <linux/mm.h>
> #include <linux/init.h>
> #include <linux/slab.h>
> #include <linux/vmalloc.h>
> #include <linux/interrupt.h>
>
> void *kvmalloc(size_t size)
> {
>         void *ptr;
>
>         if (size < PAGE_SIZE)
>                 return kmalloc(PAGE_SIZE, GFP_KERNEL);
>         ptr = alloc_pages_exact(size, GFP_KERNEL | __GFP_NOWARN);
>         if (ptr != NULL)
>                 return ptr;
>
>         return vmalloc(size);
> }
> EXPORT_SYMBOL(kvmalloc);
>
> void kvfree(void *ptr, size_t size)
> {
>         if (size < PAGE_SIZE)
>                 kfree(ptr);
>         else if (is_vmalloc_addr(ptr))
>                 vfree(ptr);
>         else
>                 free_pages_exact(ptr, size);
> }
> EXPORT_SYMBOL(kvfree);
>
> struct kvfree_work_struct {
>         struct work_struct       work;
>         void                     *head;
>         void                     **ptail;
> };
>
> DEFINE_PER_CPU(struct kvfree_work_struct, kvfree_work_struct);
>
> static void kvfree_work(struct work_struct *_work)
> {
>         struct kvfree_work_struct *work;
>         void *head, *tmp;
>
>         work = container_of(_work, struct kvfree_work_struct, work);
>         local_bh_disable();
>         head = work->head;
>         work->head = NULL;
>         work->ptail = &work->head;
>         local_bh_enable();

local_bh_disable() should be local_irq_disable(), and local_bh_enable()
should be local_irq_enable().

>
>         while (head) {
>                 tmp = head;
>                 head = *(void **)head;
>                 vfree(tmp);
>         }
> }
>
> void kvfree_inatomic(void *ptr, size_t size)
> {
>         if (size < PAGE_SIZE) {
>                 kfree(ptr);
>         } else if (is_vmalloc_addr(ptr)) {
>                 struct kvfree_work_struct *work;
>
>                 *(void **)ptr = NULL;
>                 local_irq_disable();
>                 work = this_cpu_ptr(&kvfree_work_struct);
>                 *(work->ptail) = ptr;
>                 work->ptail = (void**)ptr;
>                 schedule_work(&work->work);
>                 local_irq_enable();
>         } else {
>                 free_pages_exact(ptr, size);
>         }
> }
> EXPORT_SYMBOL(kvfree_inatomic);
>
> static int kvfree_work_struct_init(void)
> {
>         int cpu;
>         struct kvfree_work_struct *work;
>
>         for_each_possible_cpu(cpu) {
>                 work = per_cpu_ptr(&kvfree_work_struct, cpu);
>                 INIT_WORK(&work->work, kvfree_work);
>                 work->head = NULL;
>                 work->ptail = &work->head;
>         }
>
>         return 0;
> }
> //pure_initcall(kvfree_work_struct_init);
>
> //--------------------
> // for testing
> static int test_init(void)
> {
>         int size;
>         void *ptr;
>
>         kvfree_work_struct_init();
>         for (size = 1; size < (1<<30); size <<= 1) {
>                 ptr = kvmalloc(size);
>                 if (is_vmalloc_addr(ptr)) {
>                         printk("%d\n", size);
>                         break;
>                 }
>                 kvfree(ptr, size);
>         }
>
>         return 0;
> }
> module_init(test_init);
>
> static void test_exit(void)
> {
>         int cpu;
>         struct kvfree_work_struct *work;
>
>         for_each_possible_cpu(cpu) {
>                 work = per_cpu_ptr(&kvfree_work_struct, cpu);
>                 cancel_work_sync(&work->work);
>         }
> }
> module_exit(test_exit);
>
> MODULE_LICENSE("GPL");
>

--
Regards，
Changli Gao(xiaosuo(a)gmail.com)

From: Changli Gao on 5 May 2010 21:30

From: Tetsuo Handa on 5 May 2010 23:20

Changli Gao wrote:
> struct kvfree_work_struct {
> struct work_struct work;
> void *head;
> void **ptail;
> };

I wonder why "struct kvfree_work_struct" is needed.
According to http://kernel.ubuntu.com/git?p=jj/ubuntu-lucid.git;a=blobdiff;f=security/apparmor/match.c;h=d2cd55419acfcae85cb748c8f837a4384a3a0d29;hp=afc2dd2260edffcf88521ae86458ad03aa8ea12c;hb=f5eba4b0a01cc671affa429ba1512b6de7caeb5b;hpb=abdff9ddaf2644d0f9962490f73e030806ba90d3 ,

static void kvfree_work(struct work_struct *work)
{
vfree(work);
}

void kvfree_inatomic(void *ptr, size_t size)
{
if (size < PAGE_SIZE) {
kfree(ptr);
} else if (is_vmalloc_addr(ptr)) {
/*
* We can embed "struct work_struct" inside *ptr
* because size >= PAGE_SIZE.
*/
struct work_struct *work = ptr;
BUILD_BUG_ON(sizeof(struct work_struct) > PAGE_SIZE);
INIT_WORK(&work, kvfree_work);
schedule_work(&work);
} else {
free_pages_exact(ptr, size);
}
}

should do what you want. (Though, I didn't test it.)
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo(a)vger.kernel.org
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/

From: Changli Gao on 5 May 2010 23:30

2010/5/6 Tetsuo Handa <penguin-kernel(a)i-love.sakura.ne.jp>:
> Changli Gao wrote:
>> struct kvfree_work_struct {
>> struct work_struct work;
>> void *head;
>> void **ptail;
>> };
>
> I wonder why "struct kvfree_work_struct" is needed.
> According to http://kernel.ubuntu.com/git?p=jj/ubuntu-lucid.git;a=blobdiff;f=security/apparmor/match.c;h=d2cd55419acfcae85cb748c8f837a4384a3a0d29;hp=afc2dd2260edffcf88521ae86458ad03aa8ea12c;hb=f5eba4b0a01cc671affa429ba1512b6de7caeb5b;hpb=abdff9ddaf2644d0f9962490f73e030806ba90d3 ,
>
> static void kvfree_work(struct work_struct *work)
> {
> vfree(work);
> }
>
> void kvfree_inatomic(void *ptr, size_t size)
> {
> if (size < PAGE_SIZE) {
> kfree(ptr);
> } else if (is_vmalloc_addr(ptr)) {
> /*
> * We can embed "struct work_struct" inside *ptr
> * because size >= PAGE_SIZE.
> */
> struct work_struct *work = ptr;
> BUILD_BUG_ON(sizeof(struct work_struct) > PAGE_SIZE);
> INIT_WORK(&work, kvfree_work);
> schedule_work(&work);

`&work` should be `work`. It is a much better idea. Thanks very much.

> } else {
> free_pages_exact(ptr, size);
> }
> }
>
> should do what you want. (Though, I didn't test it.)
>

--
Regards，
Changli Gao(xiaosuo(a)gmail.com)
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo(a)vger.kernel.org
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/

From: Jamie Lokier on 6 May 2010 11:40

Changli Gao wrote:
> kvmalloc() will try to allocate physically contiguous memory first, and try
> vmalloc to allocate virtually contiguous memory when the former allocation
> fails.

Note that converting users from vmalloc() to kvmalloc() may increase
fragmentation problems for other parts of the kernel, because it will
tend to use up more of the available large blocks, especially with users
who allocate large blocks often. That's worth a mention
somewhere.

On the other hand, this API could make it easier to convert some kmalloc()
calls to kvmalloc(), reducing fragmentation problems. :-)

Since the caller is indicating they don't mind which happens, then
anti-fragmentation heuristics (such as checking watermarks) could be
added to kvmalloc() at some future time, if needed.

-- Jamie
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo(a)vger.kernel.org
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/

| Next | Last
Pages: 1 2 3 4
Prev: Your Webmail Quota Has Exceeded The Set Quota Please Upgrade
Next: staging: hv: Add Time Sync feature to hv_utils module