Re: [PATCH] bpf: Separate bpf_local_storage_lookup() fast and slow paths

31 Jan 2024

diff --git a/include/linux/bpf_local_storage.h b/include/linux/bpf_local_storage.h
index 173ec7f43ed1..c8cecf7fff87 100644
--- a/include/linux/bpf_local_storage.h
+++ b/include/linux/bpf_local_storage.h
@@ -130,9 +130,24 @@ bpf_local_storage_map_alloc(union bpf_attr *attr,
                          bool bpf_ma);
struct bpf_local_storage_data *
+bpf_local_storage_lookup_slowpath(struct bpf_local_storage *local_storage,
+				  struct bpf_local_storage_map *smap,
+				  bool cacheit_lockit);
+static inline struct bpf_local_storage_data *
 bpf_local_storage_lookup(struct bpf_local_storage *local_storage,
 			 struct bpf_local_storage_map *smap,
-			 bool cacheit_lockit);
+			 bool cacheit_lockit)
+{
+	struct bpf_local_storage_data *sdata;
+
+	/* Fast path (cache hit) */
+	sdata = rcu_dereference_check(local_storage->cache[smap->cache_idx],
+				      bpf_rcu_lock_held());
+	if (likely(sdata && rcu_access_pointer(sdata->smap) == smap))
+		return sdata;
+
+	return bpf_local_storage_lookup_slowpath(local_storage, smap, cacheit_lockit);
+}
void bpf_local_storage_destroy(struct bpf_local_storage *local_storage);
diff --git a/kernel/bpf/bpf_local_storage.c b/kernel/bpf/bpf_local_storage.c
index 146824cc9689..2ef782a1bd6f 100644
--- a/kernel/bpf/bpf_local_storage.c
+++ b/kernel/bpf/bpf_local_storage.c
@@ -415,20 +415,14 @@ void bpf_selem_unlink(struct bpf_local_storage_elem *selem, bool reuse_now)
  }
/* If cacheit_lockit is false, this lookup function is lockless */
-struct bpf_local_storage_data *
-bpf_local_storage_lookup(struct bpf_local_storage *local_storage,
-			 struct bpf_local_storage_map *smap,
-			 bool cacheit_lockit)
+noinline struct bpf_local_storage_data *
Is noinline needed?
Yes, so that neither this TU nor LTO kernels inline the slowpath, which
would cause worse codegen in the caller.
...
...
+bpf_local_storage_lookup_slowpath(struct bpf_local_storage *local_storage,
+				  struct bpf_local_storage_map *smap,
+				  bool cacheit_lockit)

{
    struct bpf_local_storage_data *sdata;
    struct bpf_local_storage_elem *selem;


-	/* Fast path (cache hit) */
-	sdata = rcu_dereference_check(local_storage->cache[smap->cache_idx],
-				      bpf_rcu_lock_held());
-	if (sdata && rcu_access_pointer(sdata->smap) == smap)
-		return sdata;
-
/* Slow path (cache miss) */
hlist_for_each_entry_rcu(selem, &local_storage->list, snode,
                          rcu_read_lock_trace_held())



diff --git a/tools/testing/selftests/bpf/progs/cgrp_ls_recursion.c b/tools/testing/selftests/bpf/progs/cgrp_ls_recursion.c
index a043d8fefdac..9895087a9235 100644
--- a/tools/testing/selftests/bpf/progs/cgrp_ls_recursion.c
+++ b/tools/testing/selftests/bpf/progs/cgrp_ls_recursion.c
@@ -21,7 +21,7 @@ struct {
      __type(value, long);
  } map_b SEC(".maps");
-SEC("fentry/bpf_local_storage_lookup")
+SEC("fentry/bpf_local_storage_lookup_slowpath")
The selftest is trying to catch recursion. The change here cannot test the same
thing because the slowpath will never be hit in test_progs. I don't have a
better idea for now either.
It also conflicts with the bpf-next tree. Was the patch created against an
internal tree?
Base was v6.7. I will do a rebase and rerun benchmarks.

    

2025

2024

2023

2022

2021

2020

2019

2018

2017

Re: [PATCH] bpf: Separate bpf_local_storage_lookup() fast and slow paths

Signed-off-by: Marco Elver <elver@google.com>