bpf: implement numbers iterator

author Andrii Nakryiko <andrii@kernel.org>

Wed, 8 Mar 2023 18:41:17 +0000 (10:41 -0800)

committer Alexei Starovoitov <ast@kernel.org>

Thu, 9 Mar 2023 00:19:51 +0000 (16:19 -0800)
author Andrii Nakryiko <andrii@kernel.org>
Wed, 8 Mar 2023 18:41:17 +0000 (10:41 -0800)
committer Alexei Starovoitov <ast@kernel.org>
Thu, 9 Mar 2023 00:19:51 +0000 (16:19 -0800)
diff --git a/include/linux/bpf.h b/include/linux/bpf.h

index 6792a79..e64ff1e 100644 (file)
--- a/include/linux/bpf.h
+++ b/include/linux/bpf.h
@@ -1617,8 +1617,12 @@ struct bpf_array {
  #define BPF_COMPLEXITY_LIMIT_INSNS      1000000 /* yes. 1M insns */
  #define MAX_TAIL_CALL_CNT 33
  
-/* Maximum number of loops for bpf_loop */
-#define BPF_MAX_LOOPS  BIT(23)
+/* Maximum number of loops for bpf_loop and bpf_iter_num.
+ * It's an enum to expose it (and thus make it discoverable) through BTF.
+ */
+enum {
+       BPF_MAX_LOOPS = 8 * 1024 * 1024,
+};
  
  #define BPF_F_ACCESS_MASK      (BPF_F_RDONLY |         \
                                  BPF_F_RDONLY_PROG |    \
diff --git a/include/uapi/linux/bpf.h b/include/uapi/linux/bpf.h

index 976b194..4abddb6 100644 (file)
--- a/include/uapi/linux/bpf.h
+++ b/include/uapi/linux/bpf.h
@@ -7112,4 +7112,12 @@ enum {
         BPF_F_TIMER_ABS = (1ULL << 0),
  };
  
+/* BPF numbers iterator state */
+struct bpf_iter_num {
+       /* opaque iterator state; having __u64 here allows to preserve correct
+        * alignment requirements in vmlinux.h, generated from BTF
+        */
+       __u64 __opaque[1];
+} __attribute__((aligned(8)));
+
  #endif /* _UAPI__LINUX_BPF_H__ */
diff --git a/kernel/bpf/bpf_iter.c b/kernel/bpf/bpf_iter.c

index 5dc307b..96856f1 100644 (file)
--- a/kernel/bpf/bpf_iter.c
+++ b/kernel/bpf/bpf_iter.c
@@ -776,3 +776,73 @@ const struct bpf_func_proto bpf_loop_proto = {
         .arg3_type      = ARG_PTR_TO_STACK_OR_NULL,
         .arg4_type      = ARG_ANYTHING,
  };
+
+struct bpf_iter_num_kern {
+       int cur; /* value last handed out by next(); start - 1 until then */
+       int end; /* upper bound of the range, exclusive */
+} __aligned(8);
+
+__diag_push();
+__diag_ignore_all("-Wmissing-prototypes",
+                 "Global functions as their definitions will be in vmlinux BTF");
+
+__bpf_kfunc int bpf_iter_num_new(struct bpf_iter_num *it, int start, int end)
+{
+       struct bpf_iter_num_kern *s = (void *)it;
+
+       BUILD_BUG_ON(sizeof(struct bpf_iter_num_kern) != sizeof(struct bpf_iter_num));
+       BUILD_BUG_ON(__alignof__(struct bpf_iter_num_kern) != __alignof__(struct bpf_iter_num));
+
+       BTF_TYPE_EMIT(struct bpf_iter_num);
+
+       /* start == end is legit, it's an empty range and we'll just get NULL
+        * on first (and any subsequent) bpf_iter_num_next() call
+        */
+       if (start > end) {
+               s->cur = s->end = 0;
+               return -EINVAL;
+       }
+
+       /* avoid overflows, e.g., if start == INT_MIN and end == INT_MAX */
+       if ((s64)end - (s64)start > BPF_MAX_LOOPS) {
+               s->cur = s->end = 0;
+               return -E2BIG;
+       }
+
+       /* user will call bpf_iter_num_next() first,
+        * which will set s->cur to exactly start value;
+        * underflow shouldn't matter
+        */
+       s->cur = start - 1;
+       s->end = end;
+
+       return 0;
+}
+
+__bpf_kfunc int *bpf_iter_num_next(struct bpf_iter_num *it)
+{
+       struct bpf_iter_num_kern *s = (void *)it;
+
+       /* check failed initialization or if we are done (same behavior);
+        * NOTE(review): s->cur + 1 is evaluated as int and only the result
+        * is widened to s64, so for s->cur == INT_MAX (start == INT_MIN in
+        * bpf_iter_num_new()) this appears to rely on the addition wrapping
+        */
+       if ((s64)(s->cur + 1) >= s->end) {
+               s->cur = s->end = 0;
+               return NULL;
+       }
+
+       s->cur++;
+
+       return &s->cur;
+}
+
+__bpf_kfunc void bpf_iter_num_destroy(struct bpf_iter_num *it)
+{
+       struct bpf_iter_num_kern *state = (void *)it;
+
+       state->cur = state->end = 0; /* same zeroed state next() leaves when done */
+}
+
+__diag_pop();
diff --git a/kernel/bpf/helpers.c b/kernel/bpf/helpers.c

index 637ac4e..f9b7eee 100644 (file)
--- a/kernel/bpf/helpers.c
+++ b/kernel/bpf/helpers.c
@@ -2411,6 +2411,9 @@ BTF_ID_FLAGS(func, bpf_rcu_read_lock)
  BTF_ID_FLAGS(func, bpf_rcu_read_unlock)
  BTF_ID_FLAGS(func, bpf_dynptr_slice, KF_RET_NULL)
  BTF_ID_FLAGS(func, bpf_dynptr_slice_rdwr, KF_RET_NULL)
+BTF_ID_FLAGS(func, bpf_iter_num_new, KF_ITER_NEW)
+BTF_ID_FLAGS(func, bpf_iter_num_next, KF_ITER_NEXT | KF_RET_NULL)
+BTF_ID_FLAGS(func, bpf_iter_num_destroy, KF_ITER_DESTROY)
  BTF_SET8_END(common_btf_ids)
  
  static const struct btf_kfunc_id_set common_kfunc_set = {
diff --git a/tools/include/uapi/linux/bpf.h b/tools/include/uapi/linux/bpf.h

index 976b194..4abddb6 100644 (file)
--- a/tools/include/uapi/linux/bpf.h
+++ b/tools/include/uapi/linux/bpf.h
@@ -7112,4 +7112,12 @@ enum {
         BPF_F_TIMER_ABS = (1ULL << 0),
  };
  
+/* BPF numbers iterator state */
+struct bpf_iter_num {
+       /* opaque iterator state; having __u64 here allows to preserve correct
+        * alignment requirements in vmlinux.h, generated from BTF
+        */
+       __u64 __opaque[1];
+} __attribute__((aligned(8)));
+
  #endif /* _UAPI__LINUX_BPF_H__ */
author	Andrii Nakryiko <andrii@kernel.org>
	Wed, 8 Mar 2023 18:41:17 +0000 (10:41 -0800)
committer	Alexei Starovoitov <ast@kernel.org>
	Thu, 9 Mar 2023 00:19:51 +0000 (16:19 -0800)
include/linux/bpf.h		patch \| blob \| history
include/uapi/linux/bpf.h		patch \| blob \| history
kernel/bpf/bpf_iter.c		patch \| blob \| history
kernel/bpf/helpers.c		patch \| blob \| history
tools/include/uapi/linux/bpf.h		patch \| blob \| history