kernel_samsung_sm7125

jenna

History

Sultan Alsawaf 690fe03782 scatterlist: Don't allocate sg lists using __get_free_page Allocating pages with __get_free_page is slower than going through the slab allocator to grab free pages out from a pool. These are the results from running the code at the bottom of this message: [ 1.278602] speedtest: __get_free_page: 9 us [ 1.278606] speedtest: kmalloc: 4 us [ 1.278609] speedtest: kmem_cache_alloc: 4 us [ 1.278611] speedtest: vmalloc: 13 us kmalloc and kmem_cache_alloc (which is what kmalloc uses for common sizes behind the scenes) are the fastest choices. Use kmalloc to speed up sg list allocation. This is the code used to produce the above measurements: #include <linux/kthread.h> #include <linux/slab.h> #include <linux/vmalloc.h> static int speedtest(void *data) { static const struct sched_param sched_max_rt_prio = { .sched_priority = MAX_RT_PRIO - 1 }; volatile s64 ctotal = 0, gtotal = 0, ktotal = 0, vtotal = 0; struct kmem_cache *page_pool; int i, j, trials = 1000; volatile ktime_t start; void *ptr[100]; sched_setscheduler_nocheck(current, SCHED_FIFO, &sched_max_rt_prio); page_pool = kmem_cache_create("pages", PAGE_SIZE, PAGE_SIZE, SLAB_PANIC, NULL); for (i = 0; i < trials; i++) { start = ktime_get(); for (j = 0; j < ARRAY_SIZE(ptr); j++) while (!(ptr[j] = kmem_cache_alloc(page_pool, GFP_KERNEL))); ctotal += ktime_us_delta(ktime_get(), start); for (j = 0; j < ARRAY_SIZE(ptr); j++) kmem_cache_free(page_pool, ptr[j]); start = ktime_get(); for (j = 0; j < ARRAY_SIZE(ptr); j++) while (!(ptr[j] = (void *)__get_free_page(GFP_KERNEL))); gtotal += ktime_us_delta(ktime_get(), start); for (j = 0; j < ARRAY_SIZE(ptr); j++) free_page((unsigned long)ptr[j]); start = ktime_get(); for (j = 0; j < ARRAY_SIZE(ptr); j++) while (!(ptr[j] = kmalloc(PAGE_SIZE, GFP_KERNEL))); ktotal += ktime_us_delta(ktime_get(), start); for (j = 0; j < ARRAY_SIZE(ptr); j++) kfree(ptr[j]); start = ktime_get(); *ptr = vmalloc(ARRAY_SIZE(ptr) * PAGE_SIZE); vtotal += ktime_us_delta(ktime_get(), start); 
vfree(*ptr); } kmem_cache_destroy(page_pool); printk("%s: __get_free_page: %lld us\n", __func__, gtotal / trials); printk("%s: kmalloc: %lld us\n", __func__, ktotal / trials); printk("%s: kmem_cache_alloc: %lld us\n", __func__, ctotal / trials); printk("%s: vmalloc: %lld us\n", __func__, vtotal / trials); complete(data); return 0; } static int __init start_test(void) { DECLARE_COMPLETION_ONSTACK(done); BUG_ON(IS_ERR(kthread_run(speedtest, &done, "malloc_test"))); wait_for_completion(&done); return 0; } late_initcall(start_test); Signed-off-by: Sultan Alsawaf <sultan@kerneltoast.com> Signed-off-by: Ruchit <ruchitmarathe@gmail.com>		5 months ago
..
842	…
fonts	…
lz4	…
lzo	…
mpi	…
raid6	…
reed_solomon	…
xz	…
zlib_deflate	…
zlib_inflate	…
zstd	…
.gitignore	…
Kconfig	…
Kconfig.debug	…
Kconfig.kasan	…
Kconfig.kgdb	…
Kconfig.ubsan	…
Makefile	…
argv_split.c	…
asn1_decoder.c	…
assoc_array.c	…
atomic64.c	…
atomic64_test.c	…
audit.c	…
bcd.c	…
bch.c	…
bitmap.c	…
bitrev.c	…
bsearch.c	…
btree.c	…
bug.c	…
build_OID_registry	…
bust_spinlocks.c	…
chacha.c	…
check_signature.c	…
checksum.c	…
clz_ctz.c	…
clz_tab.c	…
cmdline.c	…
compat_audit.c	…
cordic.c	…
cpu_rmap.c	…
cpumask.c	…
crc-ccitt.c	…
crc-itu-t.c	…
crc-t10dif.c	…
crc4.c	…
crc7.c	…
crc8.c	…
crc16.c	…
crc32.c	…
crc32defs.h	…
crc32test.c	…
ctype.c	…
debug_info.c	…
debug_locks.c	…
debugobjects.c	…
dec_and_lock.c	…
decompress.c	…
decompress_bunzip2.c	…
decompress_inflate.c	…
decompress_unlz4.c	…
decompress_unlzma.c	…
decompress_unlzo.c	…
decompress_unxz.c	…
devres.c	…
digsig.c	…
div64.c	…
dma-debug.c	…
dma-noop.c	…
dma-virt.c	…
dump_stack.c	…
dynamic_debug.c	…
dynamic_queue_limits.c	…
earlycpio.c	…
errseq.c	…
extable.c	…
fault-inject.c	…
fdt.c	…
fdt_empty_tree.c	…
fdt_ro.c	…
fdt_rw.c	…
fdt_strerror.c	…
fdt_sw.c	…
fdt_wip.c	…
find_bit.c	…
flex_array.c	…
flex_proportions.c	…
gcd.c	…
gen_crc32table.c	…
genalloc.c	…
glob.c	…
globtest.c	…
hexdump.c	…
hweight.c	…
idr.c	…
inflate.c	…
int_sqrt.c	…
interval_tree.c	…
interval_tree_test.c	…
iomap.c	…
iomap_copy.c	…
iommu-common.c	…
iommu-helper.c	…
ioremap.c	…
iov_iter.c	…
irq_poll.c	…
irq_regs.c	…
is_single_threaded.c	…
jedec_ddr_data.c	…
kasprintf.c	…
kfifo.c	…
klist.c	…
kobject.c	…
kobject_uevent.c	…
kstrtox.c	…
kstrtox.h	…
lcm.c	…
libcrc32c.c	…
list_debug.c	…
list_sort.c	…
llist.c	…
locking-selftest-hardirq.h	…
locking-selftest-mutex.h	…
locking-selftest-rlock-hardirq.h	…
locking-selftest-rlock-softirq.h	…
locking-selftest-rlock.h	…
locking-selftest-rsem.h	…
locking-selftest-rtmutex.h	…
locking-selftest-softirq.h	…
locking-selftest-spin-hardirq.h	…
locking-selftest-spin-softirq.h	…
locking-selftest-spin.h	…
locking-selftest-wlock-hardirq.h	…
locking-selftest-wlock-softirq.h	…
locking-selftest-wlock.h	…
locking-selftest-wsem.h	…
locking-selftest.c	…
lockref.c	…
lru_cache.c	…
memory-notifier-error-inject.c	…
memweight.c	…
net_utils.c	…
netdev-notifier-error-inject.c	…
nlattr.c	…
nmi_backtrace.c	…
nodemask.c	…
notifier-error-inject.c	…
notifier-error-inject.h	…
of-reconfig-notifier-error-inject.c	…
oid_registry.c	…
once.c	…
parman.c	…
parser.c	…
pci_iomap.c	…
percpu-refcount.c	…
percpu_counter.c	…
percpu_ida.c	…
percpu_test.c	…
plist.c	…
pm-notifier-error-inject.c	…
prime_numbers.c	…
radix-tree.c	…
random32.c	…
ratelimit.c	…
rational.c	…
rbtree.c	…
rbtree_test.c	…
reciprocal_div.c	…
refcount.c	…
rhashtable.c	…
sbitmap.c	…
scatterlist.c	scatterlist: Don't allocate sg lists using __get_free_page	5 months ago
seq_buf.c	…
sg_pool.c	…
sg_split.c	…
sha1.c	…
show_mem.c	…
siphash.c	…
smp_processor_id.c	…
sort.c	…
stackdepot.c	…
stmp_device.c	…
string.c	…
string_helpers.c	…
strncpy_from_user.c	…
strnlen_user.c	…
swiotlb.c	…
syscall.c	…
test-kstrtox.c	…
test-string_helpers.c	…
test_bitmap.c	…
test_bpf.c	…
test_debug_virtual.c	…
test_firmware.c	…
test_hash.c	…
test_hexdump.c	…
test_kasan.c	…
test_kmod.c	…
test_list_sort.c	…
test_meminit.c	…
test_module.c	…
test_parman.c	…
test_printf.c	…
test_rhashtable.c	…
test_siphash.c	…
test_sort.c	…
test_stackinit.c	…
test_static_key_base.c	…
test_static_keys.c	…
test_sysctl.c	…
test_user_copy.c	…
test_uuid.c	…
textsearch.c	…
timerqueue.c	…
ts_bm.c	…
ts_fsm.c	…
ts_kmp.c	…
ubsan.c	…
ubsan.h	…
ucs2_string.c	…
usercopy.c	…
uuid.c	…
vsprintf.c	…
win_minmax.c	…
xxhash.c	…