From fbe31051cb119220c0c464193667996eb80bb3cf Mon Sep 17 00:00:00 2001
From: Vadim Fedorenko
Date: Mon, 14 Oct 2024 04:07:13 -0700
Subject: [PATCH 1/4] bpf: add bpf_get_cpu_time_counter kfunc

Add a new kfunc to return the arch-specific time counter. The main reason
to implement this kfunc is to avoid the extra overhead of benchmark
measurements, which are usually done with a pair of bpf_ktime_get_ns()
calls at the beginning and at the end of the code block under benchmark.
When fully JITed this function does not convert the value to the monotonic
clock and saves CPU cycles by reading the time counter in a single-digit
number of instructions. Delta values can be translated into nanoseconds
using the kfunc introduced in the next patch. For x86 the BPF JIT converts
this kfunc into an ordered rdtsc sequence. Other architectures can get a
JIT implementation as well where supported. The fallback is to return the
CLOCK_MONOTONIC_RAW value in ns.

The JITed version of the function uses the "LFENCE; RDTSC" variant because
it does not care about the cookie value returned by "RDTSCP" and does not
want to clobber RCX. The LFENCE option provides the same ordering guarantee
as the RDTSCP variant.

The simplest use-case is added in the 4th patch, where we calculate the
time spent by the bpf_get_ns_current_pid_tgid() helper. A more complex
example is to use a session cookie to store the time counter value at
kprobe/uprobe using kprobe.session/uprobe.session, and calculate the
difference at kretprobe/uretprobe.

Acked-by: Eduard Zingerman
Acked-by: Andrii Nakryiko
Acked-by: Yonghong Song
Signed-off-by: Vadim Fedorenko
---
 arch/x86/net/bpf_jit_comp.c   | 47 +++++++++++++++++++++++++++++++++++
 arch/x86/net/bpf_jit_comp32.c | 33 ++++++++++++++++++++++++
 include/linux/bpf.h           |  3 +++
 include/linux/filter.h        |  1 +
 kernel/bpf/core.c             | 11 ++++++++
 kernel/bpf/helpers.c          |  6 +++++
 kernel/bpf/verifier.c         | 41 +++++++++++++++++++++++++-----
 7 files changed, 136 insertions(+), 6 deletions(-)

diff --git a/arch/x86/net/bpf_jit_comp.c b/arch/x86/net/bpf_jit_comp.c
index d3491cc0898bf..92cd5945d6302 100644
--- a/arch/x86/net/bpf_jit_comp.c
+++ b/arch/x86/net/bpf_jit_comp.c
@@ -15,6 +15,7 @@
 #include
 #include
 #include
+#include
 #include
 #include
 #include
@@ -2254,6 +2255,40 @@ st: if (is_imm8(insn->off))
 	case BPF_JMP | BPF_CALL: {
 		u8 *ip = image + addrs[i - 1];

+		if (insn->src_reg == BPF_PSEUDO_KFUNC_CALL &&
+		    IS_ENABLED(CONFIG_BPF_SYSCALL) &&
+		    imm32 == BPF_CALL_IMM(bpf_get_cpu_time_counter) &&
+		    cpu_feature_enabled(X86_FEATURE_TSC) &&
+		    using_native_sched_clock() && sched_clock_stable()) {
+			/* The default implementation of this kfunc uses
+			 * ktime_get_raw_fast_ns(), which is effectively
+			 * `(u64)rdtsc_ordered() & S64_MAX`. The JIT skips the
+			 * masking part because we assume it is not needed in
+			 * the BPF use case (two measurements close in time).
+			 * The original rdtsc_ordered() code uses the sequence
+			 * 'rdtsc; nop; nop; nop', which gets patched into
+			 * 'lfence; rdtsc' or 'rdtscp' depending on CPU features.
+			 * The JIT uses the 'lfence; rdtsc' variant because a
+			 * BPF program does not care about the cookie provided
+			 * by rdtscp in RCX.
+ * Save RDX because RDTSC will use EDX:EAX to return u64 + */ + emit_mov_reg(&prog, true, AUX_REG, BPF_REG_3); + if (cpu_feature_enabled(X86_FEATURE_LFENCE_RDTSC)) + EMIT_LFENCE(); + EMIT2(0x0F, 0x31); + + /* shl RDX, 32 */ + maybe_emit_1mod(&prog, BPF_REG_3, true); + EMIT3(0xC1, add_1reg(0xE0, BPF_REG_3), 32); + /* or RAX, RDX */ + maybe_emit_mod(&prog, BPF_REG_0, BPF_REG_3, true); + EMIT2(0x09, add_2reg(0xC0, BPF_REG_0, BPF_REG_3)); + /* restore RDX from R11 */ + emit_mov_reg(&prog, true, BPF_REG_3, AUX_REG); + + break; + } + func = (u8 *) __bpf_call_base + imm32; if (src_reg == BPF_PSEUDO_CALL && tail_call_reachable) { LOAD_TAIL_CALL_CNT_PTR(stack_depth); @@ -3865,3 +3900,15 @@ bool bpf_jit_supports_timed_may_goto(void) { return true; } + +/* x86-64 JIT can inline kfunc */ +bool bpf_jit_inlines_kfunc_call(s32 imm) +{ + if (!IS_ENABLED(CONFIG_BPF_SYSCALL)) + return false; + if (imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) && + cpu_feature_enabled(X86_FEATURE_TSC) && + using_native_sched_clock() && sched_clock_stable()) + return true; + return false; +} diff --git a/arch/x86/net/bpf_jit_comp32.c b/arch/x86/net/bpf_jit_comp32.c index de0f9e5f9f73a..7f13509c66db8 100644 --- a/arch/x86/net/bpf_jit_comp32.c +++ b/arch/x86/net/bpf_jit_comp32.c @@ -16,6 +16,7 @@ #include #include #include +#include #include /* @@ -2094,6 +2095,27 @@ static int do_jit(struct bpf_prog *bpf_prog, int *addrs, u8 *image, if (insn->src_reg == BPF_PSEUDO_KFUNC_CALL) { int err; + if (IS_ENABLED(CONFIG_BPF_SYSCALL) && + imm32 == BPF_CALL_IMM(bpf_get_cpu_time_counter) && + cpu_feature_enabled(X86_FEATURE_TSC) && + using_native_sched_clock() && sched_clock_stable()) { + /* The default implementation of this kfunc uses + * ktime_get_raw_ns() which effectively is implemented as + * `(u64)rdtsc_ordered() & S64_MAX`. For JIT We skip + * masking part because we assume it's not needed in BPF + * use case (two measurements close in time). + * Original code for rdtsc_ordered() uses sequence: + * 'rdtsc; nop; nop; nop' to patch it into + * 'lfence; rdtsc' or 'rdtscp' depending on CPU features. + * JIT uses 'lfence; rdtsc' variant because BPF program + * doesn't care about cookie provided by rdtscp in ECX. 
+ */ + if (cpu_feature_enabled(X86_FEATURE_LFENCE_RDTSC)) + EMIT3(0x0F, 0xAE, 0xE8); + EMIT2(0x0F, 0x31); + break; + } + err = emit_kfunc_call(bpf_prog, image + addrs[i], insn, &prog); @@ -2621,3 +2643,14 @@ bool bpf_jit_supports_kfunc_call(void) { return true; } + +bool bpf_jit_inlines_kfunc_call(s32 imm) +{ + if (!IS_ENABLED(CONFIG_BPF_SYSCALL)) + return false; + if (imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) && + cpu_feature_enabled(X86_FEATURE_TSC) && + using_native_sched_clock() && sched_clock_stable()) + return true; + return false; +} diff --git a/include/linux/bpf.h b/include/linux/bpf.h index 7d55553de3fce..599aaa854e4c2 100644 --- a/include/linux/bpf.h +++ b/include/linux/bpf.h @@ -3387,6 +3387,9 @@ void bpf_user_rnd_init_once(void); u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); u64 bpf_get_raw_cpu_id(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); +/* Inlined kfuncs */ +u64 bpf_get_cpu_time_counter(void); + #if defined(CONFIG_NET) bool bpf_sock_common_is_valid_access(int off, int size, enum bpf_access_type type, diff --git a/include/linux/filter.h b/include/linux/filter.h index 590476743f7a3..2fbfa1bc3f497 100644 --- a/include/linux/filter.h +++ b/include/linux/filter.h @@ -1128,6 +1128,7 @@ struct bpf_prog *bpf_int_jit_compile(struct bpf_prog *prog); void bpf_jit_compile(struct bpf_prog *prog); bool bpf_jit_needs_zext(void); bool bpf_jit_inlines_helper_call(s32 imm); +bool bpf_jit_inlines_kfunc_call(s32 imm); bool bpf_jit_supports_subprog_tailcalls(void); bool bpf_jit_supports_percpu_insn(void); bool bpf_jit_supports_kfunc_call(void); diff --git a/kernel/bpf/core.c b/kernel/bpf/core.c index 62cb9557ad3be..1d811fc39eacd 100644 --- a/kernel/bpf/core.c +++ b/kernel/bpf/core.c @@ -3035,6 +3035,17 @@ bool __weak bpf_jit_inlines_helper_call(s32 imm) return false; } +/* Return true if the JIT inlines the call to the kfunc corresponding to + * the imm. + * + * The verifier will not patch the insn->imm for the call to the helper if + * this returns true. + */ +bool __weak bpf_jit_inlines_kfunc_call(s32 imm) +{ + return false; +} + /* Return TRUE if the JIT backend supports mixing bpf2bpf and tailcalls. */ bool __weak bpf_jit_supports_subprog_tailcalls(void) { diff --git a/kernel/bpf/helpers.c b/kernel/bpf/helpers.c index 5449756ba102e..43bf35a15f788 100644 --- a/kernel/bpf/helpers.c +++ b/kernel/bpf/helpers.c @@ -3193,6 +3193,11 @@ __bpf_kfunc void bpf_local_irq_restore(unsigned long *flags__irq_flag) local_irq_restore(*flags__irq_flag); } +__bpf_kfunc u64 bpf_get_cpu_time_counter(void) +{ + return ktime_get_raw_fast_ns(); +} + __bpf_kfunc_end_defs(); BTF_KFUNCS_START(generic_btf_ids) @@ -3293,6 +3298,7 @@ BTF_ID_FLAGS(func, bpf_iter_kmem_cache_next, KF_ITER_NEXT | KF_RET_NULL | KF_SLE BTF_ID_FLAGS(func, bpf_iter_kmem_cache_destroy, KF_ITER_DESTROY | KF_SLEEPABLE) BTF_ID_FLAGS(func, bpf_local_irq_save) BTF_ID_FLAGS(func, bpf_local_irq_restore) +BTF_ID_FLAGS(func, bpf_get_cpu_time_counter, KF_FASTCALL) BTF_KFUNCS_END(common_btf_ids) static const struct btf_kfunc_id_set common_kfunc_set = { diff --git a/kernel/bpf/verifier.c b/kernel/bpf/verifier.c index 3303a3605ee80..0c4ea977973cb 100644 --- a/kernel/bpf/verifier.c +++ b/kernel/bpf/verifier.c @@ -17035,6 +17035,24 @@ static bool verifier_inlines_helper_call(struct bpf_verifier_env *env, s32 imm) } } +/* True if fixup_kfunc_call() replaces calls to kfunc number 'imm', + * replacement patch is presumed to follow bpf_fastcall contract + * (see mark_fastcall_pattern_for_call() below). 
+ */ +static bool verifier_inlines_kfunc_call(struct bpf_verifier_env *env, s32 imm) +{ + const struct bpf_kfunc_desc *desc = find_kfunc_desc(env->prog, imm, 0); + + if (!env->prog->jit_requested) + return false; + + if (desc->func_id == special_kfunc_list[KF_bpf_cast_to_kern_ctx] || + desc->func_id == special_kfunc_list[KF_bpf_rdonly_cast]) + return true; + + return false; +} + struct call_summary { u8 num_params; bool is_void; @@ -17077,7 +17095,10 @@ static bool get_call_summary(struct bpf_verifier_env *env, struct bpf_insn *call /* error would be reported later */ return false; cs->num_params = btf_type_vlen(meta.func_proto); - cs->fastcall = meta.kfunc_flags & KF_FASTCALL; + cs->fastcall = meta.kfunc_flags & KF_FASTCALL && + (verifier_inlines_kfunc_call(env, call->imm) || + (meta.btf == btf_vmlinux && + bpf_jit_inlines_kfunc_call(call->imm))); cs->is_void = btf_type_is_void(btf_type_by_id(meta.btf, meta.func_proto->type)); return true; } @@ -21223,6 +21244,7 @@ static int fixup_kfunc_call(struct bpf_verifier_env *env, struct bpf_insn *insn, struct bpf_insn *insn_buf, int insn_idx, int *cnt) { const struct bpf_kfunc_desc *desc; + s32 imm = insn->imm; if (!insn->imm) { verbose(env, "invalid kernel function call not eliminated in verifier pass\n"); @@ -21246,7 +21268,18 @@ static int fixup_kfunc_call(struct bpf_verifier_env *env, struct bpf_insn *insn, insn->imm = BPF_CALL_IMM(desc->addr); if (insn->off) return 0; - if (desc->func_id == special_kfunc_list[KF_bpf_obj_new_impl] || + if (verifier_inlines_kfunc_call(env, imm)) { + if (desc->func_id == special_kfunc_list[KF_bpf_cast_to_kern_ctx] || + desc->func_id == special_kfunc_list[KF_bpf_rdonly_cast]) { + insn_buf[0] = BPF_MOV64_REG(BPF_REG_0, BPF_REG_1); + *cnt = 1; + } else { + verbose(env, "verifier internal error: kfunc id %d has no inline code\n", + desc->func_id); + return -EFAULT; + } + + } else if (desc->func_id == special_kfunc_list[KF_bpf_obj_new_impl] || desc->func_id == special_kfunc_list[KF_bpf_percpu_obj_new_impl]) { struct btf_struct_meta *kptr_struct_meta = env->insn_aux_data[insn_idx].kptr_struct_meta; struct bpf_insn addr[2] = { BPF_LD_IMM64(BPF_REG_2, (long)kptr_struct_meta) }; @@ -21307,10 +21340,6 @@ static int fixup_kfunc_call(struct bpf_verifier_env *env, struct bpf_insn *insn, __fixup_collection_insert_kfunc(&env->insn_aux_data[insn_idx], struct_meta_reg, node_offset_reg, insn, insn_buf, cnt); - } else if (desc->func_id == special_kfunc_list[KF_bpf_cast_to_kern_ctx] || - desc->func_id == special_kfunc_list[KF_bpf_rdonly_cast]) { - insn_buf[0] = BPF_MOV64_REG(BPF_REG_0, BPF_REG_1); - *cnt = 1; } else if (is_bpf_wq_set_callback_impl_kfunc(desc->func_id)) { struct bpf_insn ld_addrs[2] = { BPF_LD_IMM64(BPF_REG_4, (long)env->prog->aux) }; From d33e1f4736d3e9dbbfdcb3dd065f339490b9fe24 Mon Sep 17 00:00:00 2001 From: Vadim Fedorenko Date: Mon, 28 Oct 2024 11:44:11 -0700 Subject: [PATCH 2/4] bpf: add bpf_cpu_time_counter_to_ns helper The new helper should be used to convert deltas of values received by bpf_get_cpu_time_counter() into nanoseconds. It is not designed to do full conversion of time counter values to CLOCK_MONOTONIC_RAW nanoseconds and cannot guarantee monotonicity of 2 independent values, but rather to convert the difference of 2 close enough values of CPU timestamp counter into nanoseconds. This function is JITted into just several instructions and adds as low overhead as possible and perfectly suits benchmark use-cases. 
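
A typical measurement then pairs the two kfuncs, for example (a sketch
modelled on the selftest added later in this series):

	__u64 start, delta_ns;

	start = bpf_get_cpu_time_counter();
	/* code under benchmark */
	delta_ns = bpf_cpu_time_counter_to_ns(bpf_get_cpu_time_counter() - start);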
When the kfunc is not JITted it returns the value provided as argument because the kfunc in previous patch will return values in nanoseconds. Reviewed-by: Eduard Zingerman Acked-by: Andrii Nakryiko Signed-off-by: Vadim Fedorenko --- arch/x86/net/bpf_jit_comp.c | 27 ++++++++++++++++++++++++++- arch/x86/net/bpf_jit_comp32.c | 27 ++++++++++++++++++++++++++- include/linux/bpf.h | 1 + kernel/bpf/helpers.c | 6 ++++++ 4 files changed, 59 insertions(+), 2 deletions(-) diff --git a/arch/x86/net/bpf_jit_comp.c b/arch/x86/net/bpf_jit_comp.c index 92cd5945d6302..56f7557048d16 100644 --- a/arch/x86/net/bpf_jit_comp.c +++ b/arch/x86/net/bpf_jit_comp.c @@ -9,6 +9,7 @@ #include #include #include +#include #include #include #include @@ -2289,6 +2290,29 @@ st: if (is_imm8(insn->off)) break; } + if (insn->src_reg == BPF_PSEUDO_KFUNC_CALL && + imm32 == BPF_CALL_IMM(bpf_cpu_time_counter_to_ns) && + cpu_feature_enabled(X86_FEATURE_TSC) && + using_native_sched_clock() && sched_clock_stable()) { + struct cyc2ns_data data; + u32 mult, shift; + + cyc2ns_read_begin(&data); + mult = data.cyc2ns_mul; + shift = data.cyc2ns_shift; + cyc2ns_read_end(); + /* imul RAX, RDI, mult */ + maybe_emit_mod(&prog, BPF_REG_1, BPF_REG_0, true); + EMIT2_off32(0x69, add_2reg(0xC0, BPF_REG_1, BPF_REG_0), + mult); + + /* shr RAX, shift (which is less than 64) */ + maybe_emit_1mod(&prog, BPF_REG_0, true); + EMIT3(0xC1, add_1reg(0xE8, BPF_REG_0), shift); + + break; + } + func = (u8 *) __bpf_call_base + imm32; if (src_reg == BPF_PSEUDO_CALL && tail_call_reachable) { LOAD_TAIL_CALL_CNT_PTR(stack_depth); @@ -3906,7 +3930,8 @@ bool bpf_jit_inlines_kfunc_call(s32 imm) { if (!IS_ENABLED(CONFIG_BPF_SYSCALL)) return false; - if (imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) && + if ((imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) || + imm == BPF_CALL_IMM(bpf_cpu_time_counter_to_ns)) && cpu_feature_enabled(X86_FEATURE_TSC) && using_native_sched_clock() && sched_clock_stable()) return true; diff --git a/arch/x86/net/bpf_jit_comp32.c b/arch/x86/net/bpf_jit_comp32.c index 7f13509c66db8..9791a3fb9d692 100644 --- a/arch/x86/net/bpf_jit_comp32.c +++ b/arch/x86/net/bpf_jit_comp32.c @@ -12,6 +12,7 @@ #include #include #include +#include #include #include #include @@ -2115,6 +2116,29 @@ static int do_jit(struct bpf_prog *bpf_prog, int *addrs, u8 *image, EMIT2(0x0F, 0x31); break; } + if (IS_ENABLED(CONFIG_BPF_SYSCALL) && + imm32 == BPF_CALL_IMM(bpf_cpu_time_counter_to_ns) && + cpu_feature_enabled(X86_FEATURE_TSC) && + using_native_sched_clock() && sched_clock_stable()) { + struct cyc2ns_data data; + u32 mult, shift; + + cyc2ns_read_begin(&data); + mult = data.cyc2ns_mul; + shift = data.cyc2ns_shift; + cyc2ns_read_end(); + + /* move parameter to BPF_REG_0 */ + emit_ia32_mov_r64(true, bpf2ia32[BPF_REG_0], + bpf2ia32[BPF_REG_1], true, true, + &prog, bpf_prog->aux); + /* multiply parameter by mut */ + emit_ia32_mul_i64(bpf2ia32[BPF_REG_0], + mult, true, &prog); + /* shift parameter by shift which is less than 64 */ + emit_ia32_rsh_i64(bpf2ia32[BPF_REG_0], + shift, true, &prog); + } err = emit_kfunc_call(bpf_prog, image + addrs[i], @@ -2648,7 +2672,8 @@ bool bpf_jit_inlines_kfunc_call(s32 imm) { if (!IS_ENABLED(CONFIG_BPF_SYSCALL)) return false; - if (imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) && + if ((imm == BPF_CALL_IMM(bpf_get_cpu_time_counter) || + imm == BPF_CALL_IMM(bpf_cpu_time_counter_to_ns)) && cpu_feature_enabled(X86_FEATURE_TSC) && using_native_sched_clock() && sched_clock_stable()) return true; diff --git a/include/linux/bpf.h b/include/linux/bpf.h 
index 599aaa854e4c2..5c4d35019b229 100644 --- a/include/linux/bpf.h +++ b/include/linux/bpf.h @@ -3389,6 +3389,7 @@ u64 bpf_get_raw_cpu_id(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5); /* Inlined kfuncs */ u64 bpf_get_cpu_time_counter(void); +u64 bpf_cpu_time_counter_to_ns(u64 cycles); #if defined(CONFIG_NET) bool bpf_sock_common_is_valid_access(int off, int size, diff --git a/kernel/bpf/helpers.c b/kernel/bpf/helpers.c index 43bf35a15f788..cc986d2048db3 100644 --- a/kernel/bpf/helpers.c +++ b/kernel/bpf/helpers.c @@ -3198,6 +3198,11 @@ __bpf_kfunc u64 bpf_get_cpu_time_counter(void) return ktime_get_raw_fast_ns(); } +__bpf_kfunc u64 bpf_cpu_time_counter_to_ns(u64 cycles) +{ + return cycles; +} + __bpf_kfunc_end_defs(); BTF_KFUNCS_START(generic_btf_ids) @@ -3299,6 +3304,7 @@ BTF_ID_FLAGS(func, bpf_iter_kmem_cache_destroy, KF_ITER_DESTROY | KF_SLEEPABLE) BTF_ID_FLAGS(func, bpf_local_irq_save) BTF_ID_FLAGS(func, bpf_local_irq_restore) BTF_ID_FLAGS(func, bpf_get_cpu_time_counter, KF_FASTCALL) +BTF_ID_FLAGS(func, bpf_cpu_time_counter_to_ns, KF_FASTCALL) BTF_KFUNCS_END(common_btf_ids) static const struct btf_kfunc_id_set common_kfunc_set = { From 7d7a574a4b0f7f1527eaba0a4c74e19e099a45e4 Mon Sep 17 00:00:00 2001 From: Vadim Fedorenko Date: Wed, 23 Oct 2024 04:02:01 -0700 Subject: [PATCH 3/4] selftests/bpf: add selftest to check bpf_get_cpu_time_counter jit bpf_get_cpu_time_counter() is replaced with rdtsc instruction on x86_64. Add tests to check that JIT works as expected. Acked-by: Eduard Zingerman Signed-off-by: Vadim Fedorenko --- .../selftests/bpf/prog_tests/verifier.c | 2 + .../selftests/bpf/progs/verifier_cpu_cycles.c | 104 ++++++++++++++++++ 2 files changed, 106 insertions(+) create mode 100644 tools/testing/selftests/bpf/progs/verifier_cpu_cycles.c diff --git a/tools/testing/selftests/bpf/prog_tests/verifier.c b/tools/testing/selftests/bpf/prog_tests/verifier.c index e66a57970d28c..d5e7e302a344f 100644 --- a/tools/testing/selftests/bpf/prog_tests/verifier.c +++ b/tools/testing/selftests/bpf/prog_tests/verifier.c @@ -102,6 +102,7 @@ #include "verifier_xdp_direct_packet_access.skel.h" #include "verifier_bits_iter.skel.h" #include "verifier_lsm.skel.h" +#include "verifier_cpu_cycles.skel.h" #include "irq.skel.h" #define MAX_ENTRIES 11 @@ -236,6 +237,7 @@ void test_verifier_bits_iter(void) { RUN(verifier_bits_iter); } void test_verifier_lsm(void) { RUN(verifier_lsm); } void test_irq(void) { RUN(irq); } void test_verifier_mtu(void) { RUN(verifier_mtu); } +void test_verifier_cpu_cycles(void) { RUN(verifier_cpu_cycles); } static int init_test_val_map(struct bpf_object *obj, char *map_name) { diff --git a/tools/testing/selftests/bpf/progs/verifier_cpu_cycles.c b/tools/testing/selftests/bpf/progs/verifier_cpu_cycles.c new file mode 100644 index 0000000000000..5b62e36903620 --- /dev/null +++ b/tools/testing/selftests/bpf/progs/verifier_cpu_cycles.c @@ -0,0 +1,104 @@ +// SPDX-License-Identifier: GPL-2.0 +/* Copyright (c) 2022 Meta Inc. 
*/ +#include "vmlinux.h" +#include +#include +#include "bpf_misc.h" + +extern u64 bpf_cpu_time_counter_to_ns(u64 cycles) __weak __ksym; +extern u64 bpf_get_cpu_time_counter(void) __weak __ksym; + +SEC("syscall") +__arch_x86_64 +__xlated("0: call kernel-function") +__naked int bpf_rdtsc(void) +{ + asm volatile( + "call %[bpf_get_cpu_time_counter];" + "exit" + : + : __imm(bpf_get_cpu_time_counter) + : __clobber_all + ); +} + +SEC("syscall") +__arch_x86_64 +/* program entry for bpf_rdtsc_jit_x86_64(), regular function prologue */ +__jited(" endbr64") +__jited(" nopl (%rax,%rax)") +__jited(" nopl (%rax)") +__jited(" pushq %rbp") +__jited(" movq %rsp, %rbp") +__jited(" endbr64") +/* save RDX in R11 as it will be overwritten */ +__jited(" movq %rdx, %r11") +/* lfence may not be executed depending on cpu features */ +__jited(" {{(lfence|)}}") +__jited(" rdtsc") +/* combine EDX:EAX into RAX */ +__jited(" shlq ${{(32|0x20)}}, %rdx") +__jited(" orq %rdx, %rax") +/* restore RDX from R11 */ +__jited(" movq %r11, %rdx") +__jited(" leave") +__naked int bpf_rdtsc_jit_x86_64(void) +{ + asm volatile( + "call %[bpf_get_cpu_time_counter];" + "exit" + : + : __imm(bpf_get_cpu_time_counter) + : __clobber_all + ); +} + +SEC("syscall") +__arch_x86_64 +__xlated("0: r1 = 42") +__xlated("1: call kernel-function") +__naked int bpf_cyc2ns(void) +{ + asm volatile( + "r1=0x2a;" + "call %[bpf_cpu_time_counter_to_ns];" + "exit" + : + : __imm(bpf_cpu_time_counter_to_ns) + : __clobber_all + ); +} + +SEC("syscall") +__arch_x86_64 +/* program entry for bpf_rdtsc_jit_x86_64(), regular function prologue */ +__jited(" endbr64") +__jited(" nopl (%rax,%rax)") +__jited(" nopl (%rax)") +__jited(" pushq %rbp") +__jited(" movq %rsp, %rbp") +__jited(" endbr64") +/* save RDX in R11 as it will be overwritten */ +__jited(" movabsq $0x2a2a2a2a2a, %rdi") +__jited(" imulq ${{.*}}, %rdi, %rax") +__jited(" shrq ${{.*}}, %rax") +__jited(" leave") +__naked int bpf_cyc2ns_jit_x86(void) +{ + asm volatile( + "r1=0x2a2a2a2a2a ll;" + "call %[bpf_cpu_time_counter_to_ns];" + "exit" + : + : __imm(bpf_cpu_time_counter_to_ns) + : __clobber_all + ); +} + +void rdtsc(void) +{ + bpf_get_cpu_time_counter(); + bpf_cpu_time_counter_to_ns(42); +} + +char _license[] SEC("license") = "GPL"; From 3329b810820b8e116999bad7ca0fa19fff77fba6 Mon Sep 17 00:00:00 2001 From: Vadim Fedorenko Date: Tue, 29 Oct 2024 10:04:54 -0700 Subject: [PATCH 4/4] selftests/bpf: add usage example for cpu time counter kfuncs The selftest provides an example of how to measure the latency of bpf kfunc/helper call using time stamp counter and how to convert measured value into nanoseconds. Signed-off-by: Vadim Fedorenko --- .../bpf/prog_tests/test_cpu_cycles.c | 35 +++++++++++++++++++ .../selftests/bpf/progs/test_cpu_cycles.c | 25 +++++++++++++ 2 files changed, 60 insertions(+) create mode 100644 tools/testing/selftests/bpf/prog_tests/test_cpu_cycles.c create mode 100644 tools/testing/selftests/bpf/progs/test_cpu_cycles.c diff --git a/tools/testing/selftests/bpf/prog_tests/test_cpu_cycles.c b/tools/testing/selftests/bpf/prog_tests/test_cpu_cycles.c new file mode 100644 index 0000000000000..d7f3b66594b34 --- /dev/null +++ b/tools/testing/selftests/bpf/prog_tests/test_cpu_cycles.c @@ -0,0 +1,35 @@ +// SPDX-License-Identifier: GPL-2.0 +/* Copyright (c) 2024 Meta Inc. 
*/ + +#include +#include "test_cpu_cycles.skel.h" + +static void cpu_cycles(void) +{ + LIBBPF_OPTS(bpf_test_run_opts, opts); + struct test_cpu_cycles *skel; + int err, pfd; + + skel = test_cpu_cycles__open_and_load(); + if (!ASSERT_OK_PTR(skel, "test_cpu_cycles open and load")) + return; + + pfd = bpf_program__fd(skel->progs.bpf_cpu_cycles); + if (!ASSERT_GT(pfd, 0, "test_cpu_cycles fd")) + goto fail; + + err = bpf_prog_test_run_opts(pfd, &opts); + if (!ASSERT_OK(err, "test_cpu_cycles test run")) + goto fail; + + ASSERT_NEQ(skel->bss->cycles, 0, "test_cpu_cycles 0 cycles"); + ASSERT_NEQ(skel->bss->ns, 0, "test_cpu_cycles 0 ns"); +fail: + test_cpu_cycles__destroy(skel); +} + +void test_cpu_cycles(void) +{ + if (test__start_subtest("cpu_cycles")) + cpu_cycles(); +} diff --git a/tools/testing/selftests/bpf/progs/test_cpu_cycles.c b/tools/testing/selftests/bpf/progs/test_cpu_cycles.c new file mode 100644 index 0000000000000..a7f8a4c6b8545 --- /dev/null +++ b/tools/testing/selftests/bpf/progs/test_cpu_cycles.c @@ -0,0 +1,25 @@ +// SPDX-License-Identifier: GPL-2.0 +/* Copyright (c) 2024 Meta Inc. */ + +#include "vmlinux.h" +#include + +extern u64 bpf_cpu_time_counter_to_ns(u64 cycles) __weak __ksym; +extern u64 bpf_get_cpu_time_counter(void) __weak __ksym; + +__u64 cycles, ns; + +SEC("syscall") +int bpf_cpu_cycles(void) +{ + struct bpf_pidns_info pidns; + __u64 start; + + start = bpf_get_cpu_time_counter(); + bpf_get_ns_current_pid_tgid(0, 0, &pidns, sizeof(struct bpf_pidns_info)); + cycles = bpf_get_cpu_time_counter() - start; + ns = bpf_cpu_time_counter_to_ns(cycles); + return 0; +} + +char _license[] SEC("license") = "GPL";
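
As an illustration of the kprobe.session use-case mentioned in the commit
message of the first patch, a minimal sketch could look as follows. It
assumes the existing bpf_session_cookie()/bpf_session_is_return() kfuncs
and an arbitrary traced function (do_sys_openat2 here is only an example,
not part of this series):

	// SPDX-License-Identifier: GPL-2.0
	#include "vmlinux.h"
	#include <bpf/bpf_helpers.h>

	extern u64 bpf_get_cpu_time_counter(void) __weak __ksym;
	extern u64 bpf_cpu_time_counter_to_ns(u64 cycles) __weak __ksym;
	extern __u64 *bpf_session_cookie(void) __weak __ksym;
	extern bool bpf_session_is_return(void) __weak __ksym;

	__u64 latency_ns;

	SEC("kprobe.session/do_sys_openat2")	/* example target function */
	int measure_latency(struct pt_regs *ctx)
	{
		__u64 *cookie = bpf_session_cookie();

		if (!cookie)
			return 0;
		if (!bpf_session_is_return()) {
			/* entry: store the raw counter value in the session cookie */
			*cookie = bpf_get_cpu_time_counter();
			return 0;
		}
		/* return: convert the delta of two close readings to ns */
		latency_ns = bpf_cpu_time_counter_to_ns(bpf_get_cpu_time_counter() - *cookie);
		return 0;
	}

	char _license[] SEC("license") = "GPL";

The entry probe stores the counter in the per-session cookie and the return
probe converts the delta, matching the pattern described in the first patch.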