author	David S. Miller <davem@davemloft.net>	2018-05-07 23:35:08 -0400
committer	David S. Miller <davem@davemloft.net>	2018-05-07 23:35:08 -0400
commit	01adc4851a8090b46c7a5ed9cfc4b97e65abfbf4 (patch)
tree	2ae02593d7139962648dff203f3f9701e34ccbc3 /tools
parent	18b338f5f9539512e76fd9ebd4c6ca1a0e159e2b (diff)
parent	e94fa1d93117e7f1eb783dc9cae6c70650944449 (diff)
Merge git://git.kernel.org/pub/scm/linux/kernel/git/bpf/bpf-next

Minor conflict: a CHECK was placed into an if() statement in net-next,
whilst a newline was added to that CHECK call in 'net'. Thanks to
Daniel for the merge resolution.

Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'tools')
-rw-r--r--  tools/bpf/bpftool/Documentation/bpftool-map.rst         |  40
-rw-r--r--  tools/bpf/bpftool/Documentation/bpftool.rst             |   2
-rw-r--r--  tools/bpf/bpftool/Makefile                              |   7
-rw-r--r--  tools/bpf/bpftool/bash-completion/bpftool               |  36
-rw-r--r--  tools/bpf/bpftool/common.c                              |  77
-rw-r--r--  tools/bpf/bpftool/main.h                                |   7
-rw-r--r--  tools/bpf/bpftool/map.c                                 |  80
-rw-r--r--  tools/bpf/bpftool/map_perf_ring.c                       | 347
-rw-r--r--  tools/bpf/bpftool/prog.c                                |   8
-rw-r--r--  tools/include/uapi/linux/bpf.h                          |  93
-rw-r--r--  tools/include/uapi/linux/erspan.h                       |  52
-rw-r--r--  tools/testing/selftests/bpf/Makefile                    |   4
-rw-r--r--  tools/testing/selftests/bpf/bpf_helpers.h               |   2
-rw-r--r--  tools/testing/selftests/bpf/test_get_stack_rawtp.c     | 102
-rw-r--r--  tools/testing/selftests/bpf/test_progs.c                | 242
-rw-r--r--  tools/testing/selftests/bpf/test_stacktrace_build_id.c |  20
-rw-r--r--  tools/testing/selftests/bpf/test_stacktrace_map.c       |  19
-rw-r--r--  tools/testing/selftests/bpf/test_verifier.c             | 311
-rw-r--r--  tools/testing/selftests/bpf/trace_helpers.c             | 180
-rw-r--r--  tools/testing/selftests/bpf/trace_helpers.h             |  23
20 files changed, 1524 insertions(+), 128 deletions(-)
diff --git a/tools/bpf/bpftool/Documentation/bpftool-map.rst b/tools/bpf/bpftool/Documentation/bpftool-map.rst
index 5f512b14bff9..a6258bc8ec4f 100644
--- a/tools/bpf/bpftool/Documentation/bpftool-map.rst
+++ b/tools/bpf/bpftool/Documentation/bpftool-map.rst
@@ -22,17 +22,19 @@ MAP COMMANDS
 =============
 
 | **bpftool** **map { show | list }** [*MAP*]
 | **bpftool** **map dump** *MAP*
-| **bpftool** **map update** *MAP* **key** [**hex**] *BYTES* **value** [**hex**] *VALUE* [*UPDATE_FLAGS*]
-| **bpftool** **map lookup** *MAP* **key** [**hex**] *BYTES*
-| **bpftool** **map getnext** *MAP* [**key** [**hex**] *BYTES*]
-| **bpftool** **map delete** *MAP* **key** [**hex**] *BYTES*
+| **bpftool** **map update** *MAP* **key** *DATA* **value** *VALUE* [*UPDATE_FLAGS*]
+| **bpftool** **map lookup** *MAP* **key** *DATA*
+| **bpftool** **map getnext** *MAP* [**key** *DATA*]
+| **bpftool** **map delete** *MAP* **key** *DATA*
 | **bpftool** **map pin** *MAP* *FILE*
+| **bpftool** **map event_pipe** *MAP* [**cpu** *N* **index** *M*]
 | **bpftool** **map help**
 |
 | *MAP* := { **id** *MAP_ID* | **pinned** *FILE* }
+| *DATA* := { [**hex**] *BYTES* }
 | *PROG* := { **id** *PROG_ID* | **pinned** *FILE* | **tag** *PROG_TAG* }
-| *VALUE* := { *BYTES* | *MAP* | *PROG* }
+| *VALUE* := { *DATA* | *MAP* | *PROG* }
 | *UPDATE_FLAGS* := { **any** | **exist** | **noexist** }
 
 DESCRIPTION
@@ -48,7 +50,7 @@ DESCRIPTION
 	**bpftool map dump** *MAP*
 		  Dump all entries in a given *MAP*.
 
-	**bpftool map update** *MAP* **key** [**hex**] *BYTES* **value** [**hex**] *VALUE* [*UPDATE_FLAGS*]
+	**bpftool map update** *MAP* **key** *DATA* **value** *VALUE* [*UPDATE_FLAGS*]
 		  Update map entry for a given *KEY*.
 
 	*UPDATE_FLAGS* can be one of: **any** update existing entry
@@ -61,13 +63,13 @@ DESCRIPTION
 		  the bytes are parsed as decimal values, unless a "0x" prefix
 		  (for hexadecimal) or a "0" prefix (for octal) is provided.
 
-	**bpftool map lookup** *MAP* **key** [**hex**] *BYTES*
+	**bpftool map lookup** *MAP* **key** *DATA*
 		  Lookup **key** in the map.
 
-	**bpftool map getnext** *MAP* [**key** [**hex**] *BYTES*]
+	**bpftool map getnext** *MAP* [**key** *DATA*]
 		  Get next key. If *key* is not specified, get first key.
 
-	**bpftool map delete** *MAP* **key** [**hex**] *BYTES*
+	**bpftool map delete** *MAP* **key** *DATA*
 		  Remove entry from the map.
 
 	**bpftool map pin** *MAP* *FILE*
@@ -75,6 +77,22 @@ DESCRIPTION
 
 	Note: *FILE* must be located in *bpffs* mount.
 
+	**bpftool** **map event_pipe** *MAP* [**cpu** *N* **index** *M*]
+		  Read events from a BPF_MAP_TYPE_PERF_EVENT_ARRAY map.
+
+		  Install perf rings into a perf event array map and dump
+		  output of any bpf_perf_event_output() call in the kernel.
+		  By default read the number of CPUs on the system and
+		  install perf ring for each CPU in the corresponding index
+		  in the array.
+
+		  If **cpu** and **index** are specified, install perf ring
+		  for given **cpu** at **index** in the array (single ring).
+
+		  Note that installing a perf ring into an array will silently
+		  replace any existing ring. Any other application will stop
+		  receiving events if it installed its rings earlier.
+
 	**bpftool map help**
 		  Print short help message.
 
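
For context, the other half of this pipeline is a BPF program writing into
the perf event array. A minimal producer sketch follows; the map name,
section name, and payload below are illustrative only and are not part of
this patch:

    /* Hypothetical producer whose output "bpftool map event_pipe" dumps. */
    #include <linux/bpf.h>
    #include "bpf_helpers.h"

    struct bpf_map_def SEC("maps") my_perf_map = {
        .type = BPF_MAP_TYPE_PERF_EVENT_ARRAY,
        .key_size = sizeof(int),
        .value_size = sizeof(__u32),
        .max_entries = 64, /* one slot per possible CPU, sized generously */
    };

    SEC("tracepoint/raw_syscalls/sys_enter")
    int emit_event(void *ctx)
    {
        __u32 val = 42; /* arbitrary example payload */

        /* BPF_F_CURRENT_CPU selects the ring at the current CPU's index,
         * matching event_pipe's default one-ring-per-CPU layout.
         */
        bpf_perf_event_output(ctx, &my_perf_map, BPF_F_CURRENT_CPU,
                              &val, sizeof(val));
        return 0;
    }

Dumping then becomes, e.g., "bpftool map event_pipe id 37" (the map id is
hypothetical).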
diff --git a/tools/bpf/bpftool/Documentation/bpftool.rst b/tools/bpf/bpftool/Documentation/bpftool.rst
index 20689a321ffe..564cb0d9692b 100644
--- a/tools/bpf/bpftool/Documentation/bpftool.rst
+++ b/tools/bpf/bpftool/Documentation/bpftool.rst
@@ -23,7 +23,7 @@ SYNOPSIS
 
 	*MAP-COMMANDS* :=
 	{ **show** | **list** | **dump** | **update** | **lookup** | **getnext** | **delete**
-	| **pin** | **help** }
+	| **pin** | **event_pipe** | **help** }
 
 	*PROG-COMMANDS* := { **show** | **list** | **dump jited** | **dump xlated** | **pin**
 	| **load** | **help** }
diff --git a/tools/bpf/bpftool/Makefile b/tools/bpf/bpftool/Makefile
index 4e69782c4a79..892dbf095bff 100644
--- a/tools/bpf/bpftool/Makefile
+++ b/tools/bpf/bpftool/Makefile
@@ -39,7 +39,12 @@ CC = gcc
 
 CFLAGS += -O2
 CFLAGS += -W -Wall -Wextra -Wno-unused-parameter -Wshadow -Wno-missing-field-initializers
-CFLAGS += -DPACKAGE='"bpftool"' -D__EXPORTED_HEADERS__ -I$(srctree)/tools/include/uapi -I$(srctree)/tools/include -I$(srctree)/tools/lib/bpf -I$(srctree)/kernel/bpf/
+CFLAGS += -DPACKAGE='"bpftool"' -D__EXPORTED_HEADERS__ \
+	-I$(srctree)/kernel/bpf/ \
+	-I$(srctree)/tools/include \
+	-I$(srctree)/tools/include/uapi \
+	-I$(srctree)/tools/lib/bpf \
+	-I$(srctree)/tools/perf
 CFLAGS += -DBPFTOOL_VERSION='"$(BPFTOOL_VERSION)"'
 LIBS = -lelf -lbfd -lopcodes $(LIBBPF)
 
diff --git a/tools/bpf/bpftool/bash-completion/bpftool b/tools/bpf/bpftool/bash-completion/bpftool
index 852d84a98acd..b301c9b315f1 100644
--- a/tools/bpf/bpftool/bash-completion/bpftool
+++ b/tools/bpf/bpftool/bash-completion/bpftool
@@ -1,6 +1,6 @@
 # bpftool(8) bash completion                              -*- shell-script -*-
 #
-# Copyright (C) 2017 Netronome Systems, Inc.
+# Copyright (C) 2017-2018 Netronome Systems, Inc.
 #
 # This software is dual licensed under the GNU General License
 # Version 2, June 1991 as shown in the file COPYING in the top-level
@@ -79,6 +79,14 @@ _bpftool_get_map_ids()
         command sed -n 's/.*"id": \(.*\),$/\1/p' )" -- "$cur" ) )
 }
 
+_bpftool_get_perf_map_ids()
+{
+    COMPREPLY+=( $( compgen -W "$( bpftool -jp map 2>&1 | \
+        command grep -C2 perf_event_array | \
+        command sed -n 's/.*"id": \(.*\),$/\1/p' )" -- "$cur" ) )
+}
+
+
 _bpftool_get_prog_ids()
 {
     COMPREPLY+=( $( compgen -W "$( bpftool -jp prog 2>&1 | \
@@ -359,10 +367,34 @@ _bpftool()
                     fi
                     return 0
                     ;;
+                event_pipe)
+                    case $prev in
+                        $command)
+                            COMPREPLY=( $( compgen -W "$MAP_TYPE" -- "$cur" ) )
+                            return 0
+                            ;;
+                        id)
+                            _bpftool_get_perf_map_ids
+                            return 0
+                            ;;
+                        cpu)
+                            return 0
+                            ;;
+                        index)
+                            return 0
+                            ;;
+                        *)
+                            _bpftool_once_attr 'cpu'
+                            _bpftool_once_attr 'index'
+                            return 0
+                            ;;
+                    esac
+                    ;;
                 *)
                     [[ $prev == $object ]] && \
                         COMPREPLY=( $( compgen -W 'delete dump getnext help \
-                            lookup pin show list update' -- "$cur" ) )
+                            lookup pin event_pipe show list update' -- \
+                            "$cur" ) )
                     ;;
             esac
             ;;
diff --git a/tools/bpf/bpftool/common.c b/tools/bpf/bpftool/common.c
index 465995281dcd..32f9e397a6c0 100644
--- a/tools/bpf/bpftool/common.c
+++ b/tools/bpf/bpftool/common.c
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2017 Netronome Systems, Inc.
+ * Copyright (C) 2017-2018 Netronome Systems, Inc.
  *
  * This software is dual licensed under the GNU General License Version 2,
  * June 1991 as shown in the file COPYING in the top-level directory of this
@@ -33,6 +33,7 @@
 
 /* Author: Jakub Kicinski <kubakici@wp.pl> */
 
+#include <ctype.h>
 #include <errno.h>
 #include <fcntl.h>
 #include <fts.h>
@@ -330,6 +331,16 @@ char *get_fdinfo(int fd, const char *key)
 	return NULL;
 }
 
+void print_data_json(uint8_t *data, size_t len)
+{
+	unsigned int i;
+
+	jsonw_start_array(json_wtr);
+	for (i = 0; i < len; i++)
+		jsonw_printf(json_wtr, "%d", data[i]);
+	jsonw_end_array(json_wtr);
+}
+
 void print_hex_data_json(uint8_t *data, size_t len)
 {
 	unsigned int i;
@@ -420,6 +431,70 @@ void delete_pinned_obj_table(struct pinned_obj_table *tab)
 	}
 }
 
+unsigned int get_page_size(void)
+{
+	static int result;
+
+	if (!result)
+		result = getpagesize();
+	return result;
+}
+
+unsigned int get_possible_cpus(void)
+{
+	static unsigned int result;
+	char buf[128];
+	long int n;
+	char *ptr;
+	int fd;
+
+	if (result)
+		return result;
+
+	fd = open("/sys/devices/system/cpu/possible", O_RDONLY);
+	if (fd < 0) {
+		p_err("can't open sysfs possible cpus");
+		exit(-1);
+	}
+
+	n = read(fd, buf, sizeof(buf));
+	if (n < 2) {
+		p_err("can't read sysfs possible cpus");
+		exit(-1);
+	}
+	close(fd);
+
+	if (n == sizeof(buf)) {
+		p_err("read sysfs possible cpus overflow");
+		exit(-1);
+	}
+
+	ptr = buf;
+	n = 0;
+	while (*ptr && *ptr != '\n') {
+		unsigned int a, b;
+
+		if (sscanf(ptr, "%u-%u", &a, &b) == 2) {
+			n += b - a + 1;
+
+			ptr = strchr(ptr, '-') + 1;
+		} else if (sscanf(ptr, "%u", &a) == 1) {
+			n++;
+		} else {
+			assert(0);
+		}
+
+		while (isdigit(*ptr))
+			ptr++;
+		if (*ptr == ',')
+			ptr++;
+	}
+
+	result = n;
+
+	return result;
+}
+
 static char *
 ifindex_to_name_ns(__u32 ifindex, __u32 ns_dev, __u32 ns_ino, char *buf)
 {
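
The sysfs file parsed by get_possible_cpus() holds comma-separated CPU
ranges such as "0-3" or "0-1,4-7". A standalone sketch of the same counting
logic, with a couple of worked inputs (this harness is illustrative and not
part of the patch):

    #include <assert.h>
    #include <ctype.h>
    #include <stdio.h>
    #include <string.h>

    /* Same range-summing loop as get_possible_cpus() above, over a string. */
    static unsigned int count_cpus(const char *s)
    {
        unsigned int n = 0, a, b;

        while (*s && *s != '\n') {
            if (sscanf(s, "%u-%u", &a, &b) == 2) {
                n += b - a + 1;          /* whole range, inclusive */
                s = strchr(s, '-') + 1;
            } else if (sscanf(s, "%u", &a) == 1) {
                n++;                     /* single CPU entry */
            }
            while (isdigit((unsigned char)*s))
                s++;
            if (*s == ',')
                s++;
        }
        return n;
    }

    int main(void)
    {
        assert(count_cpus("0-3\n") == 4);     /* typical 4-CPU box */
        assert(count_cpus("0\n") == 1);       /* uniprocessor */
        assert(count_cpus("0-1,4-7\n") == 6); /* sparse mask: 0,1,4,5,6,7 */
        printf("ok\n");
        return 0;
    }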
diff --git a/tools/bpf/bpftool/main.h b/tools/bpf/bpftool/main.h
index b8e9584d6246..6173cd997e7a 100644
--- a/tools/bpf/bpftool/main.h
+++ b/tools/bpf/bpftool/main.h
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2017 Netronome Systems, Inc.
+ * Copyright (C) 2017-2018 Netronome Systems, Inc.
  *
  * This software is dual licensed under the GNU General License Version 2,
  * June 1991 as shown in the file COPYING in the top-level directory of this
@@ -117,14 +117,19 @@ int do_pin_fd(int fd, const char *name);
 
 int do_prog(int argc, char **arg);
 int do_map(int argc, char **arg);
+int do_event_pipe(int argc, char **argv);
 int do_cgroup(int argc, char **arg);
 
 int prog_parse_fd(int *argc, char ***argv);
+int map_parse_fd_and_info(int *argc, char ***argv, void *info, __u32 *info_len);
 
 void disasm_print_insn(unsigned char *image, ssize_t len, int opcodes,
 		       const char *arch);
+void print_data_json(uint8_t *data, size_t len);
 void print_hex_data_json(uint8_t *data, size_t len);
 
+unsigned int get_page_size(void);
+unsigned int get_possible_cpus(void);
 const char *ifindex_to_bfd_name_ns(__u32 ifindex, __u64 ns_dev, __u64 ns_ino);
 
 #endif
diff --git a/tools/bpf/bpftool/map.c b/tools/bpf/bpftool/map.c
index a6cdb640a0d7..af6766e956ba 100644
--- a/tools/bpf/bpftool/map.c
+++ b/tools/bpf/bpftool/map.c
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2017 Netronome Systems, Inc.
+ * Copyright (C) 2017-2018 Netronome Systems, Inc.
  *
  * This software is dual licensed under the GNU General License Version 2,
  * June 1991 as shown in the file COPYING in the top-level directory of this
@@ -34,7 +34,6 @@
 /* Author: Jakub Kicinski <kubakici@wp.pl> */
 
 #include <assert.h>
-#include <ctype.h>
 #include <errno.h>
 #include <fcntl.h>
 #include <stdbool.h>
@@ -69,61 +68,6 @@ static const char * const map_type_name[] = {
 	[BPF_MAP_TYPE_CPUMAP]		= "cpumap",
 };
 
-static unsigned int get_possible_cpus(void)
-{
-	static unsigned int result;
-	char buf[128];
-	long int n;
-	char *ptr;
-	int fd;
-
-	if (result)
-		return result;
-
-	fd = open("/sys/devices/system/cpu/possible", O_RDONLY);
-	if (fd < 0) {
-		p_err("can't open sysfs possible cpus");
-		exit(-1);
-	}
-
-	n = read(fd, buf, sizeof(buf));
-	if (n < 2) {
-		p_err("can't read sysfs possible cpus");
-		exit(-1);
-	}
-	close(fd);
-
-	if (n == sizeof(buf)) {
-		p_err("read sysfs possible cpus overflow");
-		exit(-1);
-	}
-
-	ptr = buf;
-	n = 0;
-	while (*ptr && *ptr != '\n') {
-		unsigned int a, b;
-
-		if (sscanf(ptr, "%u-%u", &a, &b) == 2) {
-			n += b - a + 1;
-
-			ptr = strchr(ptr, '-') + 1;
-		} else if (sscanf(ptr, "%u", &a) == 1) {
-			n++;
-		} else {
-			assert(0);
-		}
-
-		while (isdigit(*ptr))
-			ptr++;
-		if (*ptr == ',')
-			ptr++;
-	}
-
-	result = n;
-
-	return result;
-}
-
 static bool map_is_per_cpu(__u32 type)
 {
 	return type == BPF_MAP_TYPE_PERCPU_HASH ||
@@ -186,8 +130,7 @@ static int map_parse_fd(int *argc, char ***argv)
 	return -1;
 }
 
-static int
-map_parse_fd_and_info(int *argc, char ***argv, void *info, __u32 *info_len)
+int map_parse_fd_and_info(int *argc, char ***argv, void *info, __u32 *info_len)
 {
 	int err;
 	int fd;
@@ -873,23 +816,25 @@ static int do_help(int argc, char **argv)
 
 	fprintf(stderr,
 		"Usage: %s %s { show | list } [MAP]\n"
 		"       %s %s dump MAP\n"
-		"       %s %s update MAP key [hex] BYTES value [hex] VALUE [UPDATE_FLAGS]\n"
-		"       %s %s lookup MAP key [hex] BYTES\n"
-		"       %s %s getnext MAP [key [hex] BYTES]\n"
-		"       %s %s delete MAP key [hex] BYTES\n"
+		"       %s %s update MAP key DATA value VALUE [UPDATE_FLAGS]\n"
+		"       %s %s lookup MAP key DATA\n"
+		"       %s %s getnext MAP [key DATA]\n"
+		"       %s %s delete MAP key DATA\n"
 		"       %s %s pin MAP FILE\n"
+		"       %s %s event_pipe MAP [cpu N index M]\n"
 		"       %s %s help\n"
 		"\n"
 		"       MAP := { id MAP_ID | pinned FILE }\n"
+		"       DATA := { [hex] BYTES }\n"
 		"       " HELP_SPEC_PROGRAM "\n"
-		"       VALUE := { BYTES | MAP | PROG }\n"
+		"       VALUE := { DATA | MAP | PROG }\n"
 		"       UPDATE_FLAGS := { any | exist | noexist }\n"
 		"       " HELP_SPEC_OPTIONS "\n"
 		"",
 		bin_name, argv[-2], bin_name, argv[-2], bin_name, argv[-2],
 		bin_name, argv[-2], bin_name, argv[-2], bin_name, argv[-2],
-		bin_name, argv[-2], bin_name, argv[-2]);
+		bin_name, argv[-2], bin_name, argv[-2], bin_name, argv[-2]);
 
 	return 0;
 }
@@ -904,6 +849,7 @@ static const struct cmd cmds[] = {
904 { "getnext", do_getnext }, 849 { "getnext", do_getnext },
905 { "delete", do_delete }, 850 { "delete", do_delete },
906 { "pin", do_pin }, 851 { "pin", do_pin },
852 { "event_pipe", do_event_pipe },
907 { 0 } 853 { 0 }
908}; 854};
909 855
diff --git a/tools/bpf/bpftool/map_perf_ring.c b/tools/bpf/bpftool/map_perf_ring.c
new file mode 100644
index 000000000000..c5a2ced8552d
--- /dev/null
+++ b/tools/bpf/bpftool/map_perf_ring.c
@@ -0,0 +1,347 @@
+// SPDX-License-Identifier: GPL-2.0-only
+/* Copyright (C) 2018 Netronome Systems, Inc. */
+/* This program is free software; you can redistribute it and/or
+ * modify it under the terms of version 2 of the GNU General Public
+ * License as published by the Free Software Foundation.
+ */
+#include <errno.h>
+#include <fcntl.h>
+#include <libbpf.h>
+#include <poll.h>
+#include <signal.h>
+#include <stdbool.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <time.h>
+#include <unistd.h>
+#include <linux/bpf.h>
+#include <linux/perf_event.h>
+#include <sys/ioctl.h>
+#include <sys/mman.h>
+#include <sys/syscall.h>
+
+#include <bpf.h>
+#include <perf-sys.h>
+
+#include "main.h"
+
+#define MMAP_PAGE_CNT	16
+
+static bool stop;
+
+struct event_ring_info {
+	int fd;
+	int key;
+	unsigned int cpu;
+	void *mem;
+};
+
+struct perf_event_sample {
+	struct perf_event_header header;
+	__u32 size;
+	unsigned char data[];
+};
+
+static void int_exit(int signo)
+{
+	fprintf(stderr, "Stopping...\n");
+	stop = true;
+}
+
+static void
+print_bpf_output(struct event_ring_info *ring, struct perf_event_sample *e)
+{
+	struct {
+		struct perf_event_header header;
+		__u64 id;
+		__u64 lost;
+	} *lost = (void *)e;
+	struct timespec ts;
+
+	if (clock_gettime(CLOCK_MONOTONIC, &ts)) {
+		perror("Can't read clock for timestamp");
+		return;
+	}
+
+	if (json_output) {
+		jsonw_start_object(json_wtr);
+		jsonw_name(json_wtr, "timestamp");
+		jsonw_uint(json_wtr, ts.tv_sec * 1000000000ull + ts.tv_nsec);
+		jsonw_name(json_wtr, "type");
+		jsonw_uint(json_wtr, e->header.type);
+		jsonw_name(json_wtr, "cpu");
+		jsonw_uint(json_wtr, ring->cpu);
+		jsonw_name(json_wtr, "index");
+		jsonw_uint(json_wtr, ring->key);
+		if (e->header.type == PERF_RECORD_SAMPLE) {
+			jsonw_name(json_wtr, "data");
+			print_data_json(e->data, e->size);
+		} else if (e->header.type == PERF_RECORD_LOST) {
+			jsonw_name(json_wtr, "lost");
+			jsonw_start_object(json_wtr);
+			jsonw_name(json_wtr, "id");
+			jsonw_uint(json_wtr, lost->id);
+			jsonw_name(json_wtr, "count");
+			jsonw_uint(json_wtr, lost->lost);
+			jsonw_end_object(json_wtr);
+		}
+		jsonw_end_object(json_wtr);
+	} else {
+		if (e->header.type == PERF_RECORD_SAMPLE) {
+			printf("== @%ld.%ld CPU: %d index: %d =====\n",
+			       (long)ts.tv_sec, ts.tv_nsec,
+			       ring->cpu, ring->key);
+			fprint_hex(stdout, e->data, e->size, " ");
+			printf("\n");
+		} else if (e->header.type == PERF_RECORD_LOST) {
+			printf("lost %lld events\n", lost->lost);
+		} else {
+			printf("unknown event type=%d size=%d\n",
+			       e->header.type, e->header.size);
+		}
+	}
+}
+
+static void
+perf_event_read(struct event_ring_info *ring, void **buf, size_t *buf_len)
+{
+	volatile struct perf_event_mmap_page *header = ring->mem;
+	__u64 buffer_size = MMAP_PAGE_CNT * get_page_size();
+	__u64 data_tail = header->data_tail;
+	__u64 data_head = header->data_head;
+	void *base, *begin, *end;
+
+	asm volatile("" ::: "memory"); /* in real code it should be smp_rmb() */
+	if (data_head == data_tail)
+		return;
+
+	base = ((char *)header) + get_page_size();
+
+	begin = base + data_tail % buffer_size;
+	end = base + data_head % buffer_size;
+
+	while (begin != end) {
+		struct perf_event_sample *e;
+
+		e = begin;
+		if (begin + e->header.size > base + buffer_size) {
+			long len = base + buffer_size - begin;
+
+			if (*buf_len < e->header.size) {
+				free(*buf);
+				*buf = malloc(e->header.size);
+				if (!*buf) {
+					fprintf(stderr,
+						"can't allocate memory");
+					stop = true;
+					return;
+				}
+				*buf_len = e->header.size;
+			}
+
+			memcpy(*buf, begin, len);
+			memcpy(*buf + len, base, e->header.size - len);
+			e = (void *)*buf;
+			begin = base + e->header.size - len;
+		} else if (begin + e->header.size == base + buffer_size) {
+			begin = base;
+		} else {
+			begin += e->header.size;
+		}
+
+		print_bpf_output(ring, e);
+	}
+
+	__sync_synchronize(); /* smp_mb() */
+	header->data_tail = data_head;
+}
+
+static int perf_mmap_size(void)
+{
+	return get_page_size() * (MMAP_PAGE_CNT + 1);
+}
+
+static void *perf_event_mmap(int fd)
+{
+	int mmap_size = perf_mmap_size();
+	void *base;
+
+	base = mmap(NULL, mmap_size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0);
+	if (base == MAP_FAILED) {
+		p_err("event mmap failed: %s\n", strerror(errno));
+		return NULL;
+	}
+
+	return base;
+}
+
+static void perf_event_unmap(void *mem)
+{
+	if (munmap(mem, perf_mmap_size()))
+		fprintf(stderr, "Can't unmap ring memory!\n");
+}
+
+static int bpf_perf_event_open(int map_fd, int key, int cpu)
+{
+	struct perf_event_attr attr = {
+		.sample_type = PERF_SAMPLE_RAW,
+		.type = PERF_TYPE_SOFTWARE,
+		.config = PERF_COUNT_SW_BPF_OUTPUT,
+	};
+	int pmu_fd;
+
+	pmu_fd = sys_perf_event_open(&attr, -1, cpu, -1, 0);
+	if (pmu_fd < 0) {
+		p_err("failed to open perf event %d for CPU %d", key, cpu);
+		return -1;
+	}
+
+	if (bpf_map_update_elem(map_fd, &key, &pmu_fd, BPF_ANY)) {
+		p_err("failed to update map for event %d for CPU %d", key, cpu);
+		goto err_close;
+	}
+	if (ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0)) {
+		p_err("failed to enable event %d for CPU %d", key, cpu);
+		goto err_close;
+	}
+
+	return pmu_fd;
+
+err_close:
+	close(pmu_fd);
+	return -1;
+}
+
+int do_event_pipe(int argc, char **argv)
+{
+	int i, nfds, map_fd, index = -1, cpu = -1;
+	struct bpf_map_info map_info = {};
+	struct event_ring_info *rings;
+	size_t tmp_buf_sz = 0;
+	void *tmp_buf = NULL;
+	struct pollfd *pfds;
+	__u32 map_info_len;
+	bool do_all = true;
+
+	map_info_len = sizeof(map_info);
+	map_fd = map_parse_fd_and_info(&argc, &argv, &map_info, &map_info_len);
+	if (map_fd < 0)
+		return -1;
+
+	if (map_info.type != BPF_MAP_TYPE_PERF_EVENT_ARRAY) {
+		p_err("map is not a perf event array");
+		goto err_close_map;
+	}
+
+	while (argc) {
+		if (argc < 2)
+			BAD_ARG();
+
+		if (is_prefix(*argv, "cpu")) {
+			char *endptr;
+
+			NEXT_ARG();
+			cpu = strtoul(*argv, &endptr, 0);
+			if (*endptr) {
+				p_err("can't parse %s as CPU ID", **argv);
+				goto err_close_map;
+			}
+
+			NEXT_ARG();
+		} else if (is_prefix(*argv, "index")) {
+			char *endptr;
+
+			NEXT_ARG();
+			index = strtoul(*argv, &endptr, 0);
+			if (*endptr) {
+				p_err("can't parse %s as index", **argv);
+				goto err_close_map;
+			}
+
+			NEXT_ARG();
+		} else {
+			BAD_ARG();
+		}
+
+		do_all = false;
+	}
+
+	if (!do_all) {
+		if (index == -1 || cpu == -1) {
+			p_err("cpu and index must be specified together");
+			goto err_close_map;
+		}
+
+		nfds = 1;
+	} else {
+		nfds = min(get_possible_cpus(), map_info.max_entries);
+		cpu = 0;
+		index = 0;
+	}
+
+	rings = calloc(nfds, sizeof(rings[0]));
+	if (!rings)
+		goto err_close_map;
+
+	pfds = calloc(nfds, sizeof(pfds[0]));
+	if (!pfds)
+		goto err_free_rings;
+
+	for (i = 0; i < nfds; i++) {
+		rings[i].cpu = cpu + i;
+		rings[i].key = index + i;
+
+		rings[i].fd = bpf_perf_event_open(map_fd, rings[i].key,
+						  rings[i].cpu);
+		if (rings[i].fd < 0)
+			goto err_close_fds_prev;
+
+		rings[i].mem = perf_event_mmap(rings[i].fd);
+		if (!rings[i].mem)
+			goto err_close_fds_current;
+
+		pfds[i].fd = rings[i].fd;
+		pfds[i].events = POLLIN;
+	}
+
+	signal(SIGINT, int_exit);
+	signal(SIGHUP, int_exit);
+	signal(SIGTERM, int_exit);
+
+	if (json_output)
+		jsonw_start_array(json_wtr);
+
+	while (!stop) {
+		poll(pfds, nfds, 200);
+		for (i = 0; i < nfds; i++)
+			perf_event_read(&rings[i], &tmp_buf, &tmp_buf_sz);
+	}
+	free(tmp_buf);
+
+	if (json_output)
+		jsonw_end_array(json_wtr);
+
+	for (i = 0; i < nfds; i++) {
+		perf_event_unmap(rings[i].mem);
+		close(rings[i].fd);
+	}
+	free(pfds);
+	free(rings);
+	close(map_fd);
+
+	return 0;
+
+err_close_fds_prev:
+	while (i--) {
+		perf_event_unmap(rings[i].mem);
+err_close_fds_current:
+		close(rings[i].fd);
+	}
+	free(pfds);
+err_free_rings:
+	free(rings);
+err_close_map:
+	close(map_fd);
+	return -1;
+}
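
The subtle part of map_perf_ring.c is the wrap-around handling in
perf_event_read(): a record that straddles the end of the ring is stitched
back together from the ring's tail and start with two memcpy() calls into a
bounce buffer. A toy demonstration of that stitch, with made-up sizes (not
part of the patch):

    #include <assert.h>
    #include <string.h>

    int main(void)
    {
        /* 8-byte "ring": a 6-byte record "abcxyz" was written starting at
         * offset 5, so it wrapped: "abc" sits at offsets 5..7, "xyz" at 0..2.
         */
        char ring[8] = { 'x', 'y', 'z', 0, 0, 'a', 'b', 'c' };
        char rec[6];
        size_t ring_sz = sizeof(ring), start = 5, rec_sz = sizeof(rec);
        size_t first = ring_sz - start;            /* bytes before the wrap: 3 */

        memcpy(rec, ring + start, first);          /* "abc" from the tail */
        memcpy(rec + first, ring, rec_sz - first); /* "xyz" from the start */
        assert(memcmp(rec, "abcxyz", rec_sz) == 0);
        return 0;
    }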
diff --git a/tools/bpf/bpftool/prog.c b/tools/bpf/bpftool/prog.c
index e71a0a11afde..9bdfdf2d3fbe 100644
--- a/tools/bpf/bpftool/prog.c
+++ b/tools/bpf/bpftool/prog.c
@@ -96,7 +96,10 @@ static void print_boot_time(__u64 nsecs, char *buf, unsigned int size)
96 return; 96 return;
97 } 97 }
98 98
99 strftime(buf, size, "%b %d/%H:%M", &load_tm); 99 if (json_output)
100 strftime(buf, size, "%s", &load_tm);
101 else
102 strftime(buf, size, "%FT%T%z", &load_tm);
100} 103}
101 104
102static int prog_fd_by_tag(unsigned char *tag) 105static int prog_fd_by_tag(unsigned char *tag)
@@ -245,7 +248,8 @@ static void print_prog_json(struct bpf_prog_info *info, int fd)
245 print_boot_time(info->load_time, buf, sizeof(buf)); 248 print_boot_time(info->load_time, buf, sizeof(buf));
246 249
247 /* Piggy back on load_time, since 0 uid is a valid one */ 250 /* Piggy back on load_time, since 0 uid is a valid one */
248 jsonw_string_field(json_wtr, "loaded_at", buf); 251 jsonw_name(json_wtr, "loaded_at");
252 jsonw_printf(json_wtr, "%s", buf);
249 jsonw_uint_field(json_wtr, "uid", info->created_by_uid); 253 jsonw_uint_field(json_wtr, "uid", info->created_by_uid);
250 } 254 }
251 255
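
The load-time formatting above now depends on the output mode: "%s" (a GNU
strftime extension) yields seconds since the epoch, which JSON consumers can
treat as a number, while "%FT%T%z" yields an ISO-8601-style local time for
humans. A small illustration with an arbitrary timestamp (output depends on
the local timezone):

    #include <stdio.h>
    #include <time.h>

    int main(void)
    {
        time_t t = 1525737308; /* arbitrary instant for demonstration */
        struct tm tm;
        char buf[64];

        localtime_r(&t, &tm);
        strftime(buf, sizeof(buf), "%s", &tm);      /* "1525737308" (JSON mode) */
        puts(buf);
        strftime(buf, sizeof(buf), "%FT%T%z", &tm); /* e.g. "2018-05-07T23:35:08-0400" */
        puts(buf);
        return 0;
    }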
diff --git a/tools/include/uapi/linux/bpf.h b/tools/include/uapi/linux/bpf.h
index da77a9388947..83a95ae388dd 100644
--- a/tools/include/uapi/linux/bpf.h
+++ b/tools/include/uapi/linux/bpf.h
@@ -828,12 +828,12 @@ union bpf_attr {
  *
  *		Also, be aware that the newer helper
  *		**bpf_perf_event_read_value**\ () is recommended over
- *		**bpf_perf_event_read*\ () in general. The latter has some ABI
+ *		**bpf_perf_event_read**\ () in general. The latter has some ABI
  *		quirks where error and counter value are used as a return code
  *		(which is wrong to do since ranges may overlap). This issue is
- *		fixed with bpf_perf_event_read_value(), which at the same time
- *		provides more features over the **bpf_perf_event_read**\ ()
- *		interface. Please refer to the description of
+ *		fixed with **bpf_perf_event_read_value**\ (), which at the same
+ *		time provides more features over the **bpf_perf_event_read**\
+ *		() interface. Please refer to the description of
  *		**bpf_perf_event_read_value**\ () for details.
  *	Return
  *		The value of the perf event counter read from the map, or a
@@ -1361,7 +1361,7 @@ union bpf_attr {
  *	Return
  *		0
  *
- * int bpf_setsockopt(struct bpf_sock_ops_kern *bpf_socket, int level, int optname, char *optval, int optlen)
+ * int bpf_setsockopt(struct bpf_sock_ops *bpf_socket, int level, int optname, char *optval, int optlen)
  *	Description
  *		Emulate a call to **setsockopt()** on the socket associated to
  *		*bpf_socket*, which must be a full socket. The *level* at
@@ -1435,7 +1435,7 @@ union bpf_attr {
  *	Return
  *		**SK_PASS** on success, or **SK_DROP** on error.
  *
- * int bpf_sock_map_update(struct bpf_sock_ops_kern *skops, struct bpf_map *map, void *key, u64 flags)
+ * int bpf_sock_map_update(struct bpf_sock_ops *skops, struct bpf_map *map, void *key, u64 flags)
  *	Description
  *		Add an entry to, or update a *map* referencing sockets. The
  *		*skops* is used as a new value for the entry associated to
@@ -1533,7 +1533,7 @@ union bpf_attr {
  *	Return
  *		0 on success, or a negative error in case of failure.
  *
- * int bpf_perf_prog_read_value(struct bpf_perf_event_data_kern *ctx, struct bpf_perf_event_value *buf, u32 buf_size)
+ * int bpf_perf_prog_read_value(struct bpf_perf_event_data *ctx, struct bpf_perf_event_value *buf, u32 buf_size)
  *	Description
  *		For en eBPF program attached to a perf event, retrieve the
  *		value of the event counter associated to *ctx* and store it in
@@ -1544,7 +1544,7 @@ union bpf_attr {
  *	Return
  *		0 on success, or a negative error in case of failure.
  *
- * int bpf_getsockopt(struct bpf_sock_ops_kern *bpf_socket, int level, int optname, char *optval, int optlen)
+ * int bpf_getsockopt(struct bpf_sock_ops *bpf_socket, int level, int optname, char *optval, int optlen)
  *	Description
  *		Emulate a call to **getsockopt()** on the socket associated to
  *		*bpf_socket*, which must be a full socket. The *level* at
@@ -1588,7 +1588,7 @@ union bpf_attr {
  *	Return
  *		0
  *
- * int bpf_sock_ops_cb_flags_set(struct bpf_sock_ops_kern *bpf_sock, int argval)
+ * int bpf_sock_ops_cb_flags_set(struct bpf_sock_ops *bpf_sock, int argval)
  *	Description
  *		Attempt to set the value of the **bpf_sock_ops_cb_flags** field
  *		for the full TCP socket associated to *bpf_sock_ops* to
@@ -1721,7 +1721,7 @@ union bpf_attr {
  *	Return
  *		0 on success, or a negative error in case of failure.
  *
- * int bpf_bind(struct bpf_sock_addr_kern *ctx, struct sockaddr *addr, int addr_len)
+ * int bpf_bind(struct bpf_sock_addr *ctx, struct sockaddr *addr, int addr_len)
  *	Description
  *		Bind the socket associated to *ctx* to the address pointed by
  *		*addr*, of length *addr_len*. This allows for making outgoing
@@ -1767,6 +1767,64 @@ union bpf_attr {
  *		**CONFIG_XFRM** configuration option.
  *	Return
  *		0 on success, or a negative error in case of failure.
+ *
+ * int bpf_get_stack(struct pt_regs *regs, void *buf, u32 size, u64 flags)
+ *	Description
+ *		Return a user or a kernel stack in bpf program provided buffer.
+ *		To achieve this, the helper needs *ctx*, which is a pointer
+ *		to the context on which the tracing program is executed.
+ *		To store the stacktrace, the bpf program provides *buf* with
+ *		a nonnegative *size*.
+ *
+ *		The last argument, *flags*, holds the number of stack frames to
+ *		skip (from 0 to 255), masked with
+ *		**BPF_F_SKIP_FIELD_MASK**. The next bits can be used to set
+ *		the following flags:
+ *
+ *		**BPF_F_USER_STACK**
+ *			Collect a user space stack instead of a kernel stack.
+ *		**BPF_F_USER_BUILD_ID**
+ *			Collect buildid+offset instead of ips for user stack,
+ *			only valid if **BPF_F_USER_STACK** is also specified.
+ *
+ *		**bpf_get_stack**\ () can collect up to
+ *		**PERF_MAX_STACK_DEPTH** both kernel and user frames, subject
+ *		to sufficient large buffer size. Note that
+ *		this limit can be controlled with the **sysctl** program, and
+ *		that it should be manually increased in order to profile long
+ *		user stacks (such as stacks for Java programs). To do so, use:
+ *
+ *		::
+ *
+ *			# sysctl kernel.perf_event_max_stack=<new value>
+ *
+ *	Return
+ *		a non-negative value equal to or less than size on success, or
+ *		a negative error in case of failure.
+ *
+ * int skb_load_bytes_relative(const struct sk_buff *skb, u32 offset, void *to, u32 len, u32 start_header)
+ *	Description
+ *		This helper is similar to **bpf_skb_load_bytes**\ () in that
+ *		it provides an easy way to load *len* bytes from *offset*
+ *		from the packet associated to *skb*, into the buffer pointed
+ *		by *to*. The difference to **bpf_skb_load_bytes**\ () is that
+ *		a fifth argument *start_header* exists in order to select a
+ *		base offset to start from. *start_header* can be one of:
+ *
+ *		**BPF_HDR_START_MAC**
+ *			Base offset to load data from is *skb*'s mac header.
+ *		**BPF_HDR_START_NET**
+ *			Base offset to load data from is *skb*'s network header.
+ *
+ *		In general, "direct packet access" is the preferred method to
+ *		access packet data, however, this helper is in particular useful
+ *		in socket filters where *skb*\ **->data** does not always point
+ *		to the start of the mac header and where "direct packet access"
+ *		is not available.
+ *
+ *	Return
+ *		0 on success, or a negative error in case of failure.
+ *
  */
 #define __BPF_FUNC_MAPPER(FN)		\
 	FN(unspec),			\
@@ -1835,7 +1893,9 @@ union bpf_attr {
 	FN(msg_pull_data),		\
 	FN(bind),			\
 	FN(xdp_adjust_tail),		\
-	FN(skb_get_xfrm_state),
+	FN(skb_get_xfrm_state),		\
+	FN(get_stack),			\
+	FN(skb_load_bytes_relative),
 
 /* integer value in 'imm' field of BPF_CALL instruction selects which helper
  * function eBPF program intends to call
@@ -1869,11 +1929,14 @@ enum bpf_func_id {
 /* BPF_FUNC_skb_set_tunnel_key and BPF_FUNC_skb_get_tunnel_key flags. */
 #define BPF_F_TUNINFO_IPV6		(1ULL << 0)
 
-/* BPF_FUNC_get_stackid flags. */
+/* flags for both BPF_FUNC_get_stackid and BPF_FUNC_get_stack. */
 #define BPF_F_SKIP_FIELD_MASK		0xffULL
 #define BPF_F_USER_STACK		(1ULL << 8)
+/* flags used by BPF_FUNC_get_stackid only. */
 #define BPF_F_FAST_STACK_CMP		(1ULL << 9)
 #define BPF_F_REUSE_STACKID		(1ULL << 10)
+/* flags used by BPF_FUNC_get_stack only. */
+#define BPF_F_USER_BUILD_ID		(1ULL << 11)
 
 /* BPF_FUNC_skb_set_tunnel_key flags. */
 #define BPF_F_ZERO_CSUM_TX		(1ULL << 1)
@@ -1893,6 +1956,12 @@ enum bpf_adj_room_mode {
 	BPF_ADJ_ROOM_NET,
 };
 
+/* Mode for BPF_FUNC_skb_load_bytes_relative helper. */
+enum bpf_hdr_start_off {
+	BPF_HDR_START_MAC,
+	BPF_HDR_START_NET,
+};
+
 /* user accessible mirror of in-kernel sk_buff.
  * new fields can only be added to the end of this structure
  */
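
The flags layout above packs an 8-bit skip count and feature bits into a
single word, so a bpf_get_stack() caller combines them with OR. A sketch of
the composition (the helper name here is ours, not from the patch):

    #include <linux/bpf.h>

    /* Skip `skip` frames and collect a user stack as buildid+offset pairs. */
    static __u64 make_stack_flags(unsigned int skip)
    {
        return (skip & BPF_F_SKIP_FIELD_MASK) |
               BPF_F_USER_STACK |
               BPF_F_USER_BUILD_ID; /* only valid together with BPF_F_USER_STACK */
    }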
diff --git a/tools/include/uapi/linux/erspan.h b/tools/include/uapi/linux/erspan.h
new file mode 100644
index 000000000000..841573019ae1
--- /dev/null
+++ b/tools/include/uapi/linux/erspan.h
@@ -0,0 +1,52 @@
+/* SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note */
+/*
+ * ERSPAN Tunnel Metadata
+ *
+ * Copyright (c) 2018 VMware
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2
+ * as published by the Free Software Foundation.
+ *
+ * Userspace API for metadata mode ERSPAN tunnel
+ */
+#ifndef _UAPI_ERSPAN_H
+#define _UAPI_ERSPAN_H
+
+#include <linux/types.h>	/* For __beXX in userspace */
+#include <asm/byteorder.h>
+
+/* ERSPAN version 2 metadata header */
+struct erspan_md2 {
+	__be32 timestamp;
+	__be16 sgt;	/* security group tag */
+#if defined(__LITTLE_ENDIAN_BITFIELD)
+	__u8	hwid_upper:2,
+		ft:5,
+		p:1;
+	__u8	o:1,
+		gra:2,
+		dir:1,
+		hwid:4;
+#elif defined(__BIG_ENDIAN_BITFIELD)
+	__u8	p:1,
+		ft:5,
+		hwid_upper:2;
+	__u8	hwid:4,
+		dir:1,
+		gra:2,
+		o:1;
+#else
+#error "Please fix <asm/byteorder.h>"
+#endif
+};
+
+struct erspan_metadata {
+	int version;
+	union {
+		__be32 index;		/* Version 1 (type II)*/
+		struct erspan_md2 md2;	/* Version 2 (type III) */
+	} u;
+};
+
+#endif /* _UAPI_ERSPAN_H */
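
Illustrative use of the new header from userspace (a sketch; the session
value is made up): a version 1 (type II) description only needs the index,
while version 2 (type III) fills struct erspan_md2 instead.

    #include <linux/erspan.h>
    #include <arpa/inet.h> /* htonl() */

    static void fill_v1(struct erspan_metadata *md, unsigned int session)
    {
        md->version = 1;
        md->u.index = htonl(session); /* big-endian on the wire */
    }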
diff --git a/tools/testing/selftests/bpf/Makefile b/tools/testing/selftests/bpf/Makefile
index b64a7a39cbc8..9d762184b805 100644
--- a/tools/testing/selftests/bpf/Makefile
+++ b/tools/testing/selftests/bpf/Makefile
@@ -32,7 +32,8 @@ TEST_GEN_FILES = test_pkt_access.o test_xdp.o test_l4lb.o test_tcp_estats.o test
 	test_l4lb_noinline.o test_xdp_noinline.o test_stacktrace_map.o \
 	sample_map_ret0.o test_tcpbpf_kern.o test_stacktrace_build_id.o \
 	sockmap_tcp_msg_prog.o connect4_prog.o connect6_prog.o test_adjust_tail.o \
-	test_btf_haskv.o test_btf_nokv.o test_sockmap_kern.o test_tunnel_kern.o
+	test_btf_haskv.o test_btf_nokv.o test_sockmap_kern.o test_tunnel_kern.o \
+	test_get_stack_rawtp.o
 
 # Order correspond to 'make run_tests' order
 TEST_PROGS := test_kmod.sh \
@@ -58,6 +59,7 @@ $(OUTPUT)/test_dev_cgroup: cgroup_helpers.c
 $(OUTPUT)/test_sock: cgroup_helpers.c
 $(OUTPUT)/test_sock_addr: cgroup_helpers.c
 $(OUTPUT)/test_sockmap: cgroup_helpers.c
+$(OUTPUT)/test_progs: trace_helpers.c
 
 .PHONY: force
 
diff --git a/tools/testing/selftests/bpf/bpf_helpers.h b/tools/testing/selftests/bpf/bpf_helpers.h
index 69d7b918e66a..265f8e0e8ada 100644
--- a/tools/testing/selftests/bpf/bpf_helpers.h
+++ b/tools/testing/selftests/bpf/bpf_helpers.h
@@ -101,6 +101,8 @@ static int (*bpf_xdp_adjust_tail)(void *ctx, int offset) =
 static int (*bpf_skb_get_xfrm_state)(void *ctx, int index, void *state,
 				     int size, int flags) =
 	(void *) BPF_FUNC_skb_get_xfrm_state;
+static int (*bpf_get_stack)(void *ctx, void *buf, int size, int flags) =
+	(void *) BPF_FUNC_get_stack;
 
 /* llvm builtin functions that eBPF C program may use to
  * emit BPF_LD_ABS and BPF_LD_IND instructions
diff --git a/tools/testing/selftests/bpf/test_get_stack_rawtp.c b/tools/testing/selftests/bpf/test_get_stack_rawtp.c
new file mode 100644
index 000000000000..f6d9f238e00a
--- /dev/null
+++ b/tools/testing/selftests/bpf/test_get_stack_rawtp.c
@@ -0,0 +1,102 @@
+// SPDX-License-Identifier: GPL-2.0
+
+#include <linux/bpf.h>
+#include "bpf_helpers.h"
+
+/* Permit pretty deep stack traces */
+#define MAX_STACK_RAWTP 100
+struct stack_trace_t {
+	int pid;
+	int kern_stack_size;
+	int user_stack_size;
+	int user_stack_buildid_size;
+	__u64 kern_stack[MAX_STACK_RAWTP];
+	__u64 user_stack[MAX_STACK_RAWTP];
+	struct bpf_stack_build_id user_stack_buildid[MAX_STACK_RAWTP];
+};
+
+struct bpf_map_def SEC("maps") perfmap = {
+	.type = BPF_MAP_TYPE_PERF_EVENT_ARRAY,
+	.key_size = sizeof(int),
+	.value_size = sizeof(__u32),
+	.max_entries = 2,
+};
+
+struct bpf_map_def SEC("maps") stackdata_map = {
+	.type = BPF_MAP_TYPE_PERCPU_ARRAY,
+	.key_size = sizeof(__u32),
+	.value_size = sizeof(struct stack_trace_t),
+	.max_entries = 1,
+};
+
+/* Allocate per-cpu space twice the needed. For the code below
+ *   usize = bpf_get_stack(ctx, raw_data, max_len, BPF_F_USER_STACK);
+ *   if (usize < 0)
+ *     return 0;
+ *   ksize = bpf_get_stack(ctx, raw_data + usize, max_len - usize, 0);
+ *
+ * If we have value_size = MAX_STACK_RAWTP * sizeof(__u64),
+ * verifier will complain that access "raw_data + usize"
+ * with size "max_len - usize" may be out of bound.
+ * The maximum "raw_data + usize" is "raw_data + max_len"
+ * and the maximum "max_len - usize" is "max_len", verifier
+ * concludes that the maximum buffer access range is
+ * "raw_data[0...max_len * 2 - 1]" and hence reject the program.
+ *
+ * Doubling the to-be-used max buffer size can fix this verifier
+ * issue and avoid complicated C programming massaging.
+ * This is an acceptable workaround since there is one entry here.
+ */
+struct bpf_map_def SEC("maps") rawdata_map = {
+	.type = BPF_MAP_TYPE_PERCPU_ARRAY,
+	.key_size = sizeof(__u32),
+	.value_size = MAX_STACK_RAWTP * sizeof(__u64) * 2,
+	.max_entries = 1,
+};
+
+SEC("tracepoint/raw_syscalls/sys_enter")
+int bpf_prog1(void *ctx)
+{
+	int max_len, max_buildid_len, usize, ksize, total_size;
+	struct stack_trace_t *data;
+	void *raw_data;
+	__u32 key = 0;
+
+	data = bpf_map_lookup_elem(&stackdata_map, &key);
+	if (!data)
+		return 0;
+
+	max_len = MAX_STACK_RAWTP * sizeof(__u64);
+	max_buildid_len = MAX_STACK_RAWTP * sizeof(struct bpf_stack_build_id);
+	data->pid = bpf_get_current_pid_tgid();
+	data->kern_stack_size = bpf_get_stack(ctx, data->kern_stack,
+					      max_len, 0);
+	data->user_stack_size = bpf_get_stack(ctx, data->user_stack, max_len,
+					      BPF_F_USER_STACK);
+	data->user_stack_buildid_size = bpf_get_stack(
+		ctx, data->user_stack_buildid, max_buildid_len,
+		BPF_F_USER_STACK | BPF_F_USER_BUILD_ID);
+	bpf_perf_event_output(ctx, &perfmap, 0, data, sizeof(*data));
+
+	/* write both kernel and user stacks to the same buffer */
+	raw_data = bpf_map_lookup_elem(&rawdata_map, &key);
+	if (!raw_data)
+		return 0;
+
+	usize = bpf_get_stack(ctx, raw_data, max_len, BPF_F_USER_STACK);
+	if (usize < 0)
+		return 0;
+
+	ksize = bpf_get_stack(ctx, raw_data + usize, max_len - usize, 0);
+	if (ksize < 0)
+		return 0;
+
+	total_size = usize + ksize;
+	if (total_size > 0 && total_size <= max_len)
+		bpf_perf_event_output(ctx, &perfmap, 0, raw_data, total_size);
+
+	return 0;
+}
+
+char _license[] SEC("license") = "GPL";
+__u32 _version SEC("version") = 1; /* ignored by tracepoints, required by libbpf.a */
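
Concrete numbers behind the rawdata_map comment above, with
MAX_STACK_RAWTP = 100: one stack needs max_len = 100 * 8 = 800 bytes, but
because the verifier bounds "raw_data + usize" by raw_data + max_len and
"max_len - usize" by max_len, it assumes accesses may reach as far as
raw_data[2 * 800 - 1]. Hence value_size is set to 1600 bytes even though at
most 800 are ever used at once.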
diff --git a/tools/testing/selftests/bpf/test_progs.c b/tools/testing/selftests/bpf/test_progs.c
index fac581f1c57f..ed197eef1cfc 100644
--- a/tools/testing/selftests/bpf/test_progs.c
+++ b/tools/testing/selftests/bpf/test_progs.c
@@ -38,8 +38,10 @@ typedef __u16 __sum16;
 #include "bpf_util.h"
 #include "bpf_endian.h"
 #include "bpf_rlimit.h"
+#include "trace_helpers.h"
 
 static int error_cnt, pass_cnt;
+static bool jit_enabled;
 
 #define MAGIC_BYTES 123
 
@@ -391,13 +393,30 @@ static inline __u64 ptr_to_u64(const void *ptr)
 	return (__u64) (unsigned long) ptr;
 }
 
+static bool is_jit_enabled(void)
+{
+	const char *jit_sysctl = "/proc/sys/net/core/bpf_jit_enable";
+	bool enabled = false;
+	int sysctl_fd;
+
+	sysctl_fd = open(jit_sysctl, 0, O_RDONLY);
+	if (sysctl_fd != -1) {
+		char tmpc;
+
+		if (read(sysctl_fd, &tmpc, sizeof(tmpc)) == 1)
+			enabled = (tmpc != '0');
+		close(sysctl_fd);
+	}
+
+	return enabled;
+}
+
 static void test_bpf_obj_id(void)
 {
 	const __u64 array_magic_value = 0xfaceb00c;
 	const __u32 array_key = 0;
 	const int nr_iters = 2;
 	const char *file = "./test_obj_id.o";
-	const char *jit_sysctl = "/proc/sys/net/core/bpf_jit_enable";
 	const char *expected_prog_name = "test_obj_id";
 	const char *expected_map_name = "test_map_id";
 	const __u64 nsec_per_sec = 1000000000;
@@ -414,20 +433,11 @@ static void test_bpf_obj_id(void)
 	char jited_insns[128], xlated_insns[128], zeros[128];
 	__u32 i, next_id, info_len, nr_id_found, duration = 0;
 	struct timespec real_time_ts, boot_time_ts;
-	int sysctl_fd, jit_enabled = 0, err = 0;
+	int err = 0;
 	__u64 array_value;
 	uid_t my_uid = getuid();
 	time_t now, load_time;
 
-	sysctl_fd = open(jit_sysctl, 0, O_RDONLY);
-	if (sysctl_fd != -1) {
-		char tmpc;
-
-		if (read(sysctl_fd, &tmpc, sizeof(tmpc)) == 1)
-			jit_enabled = (tmpc != '0');
-		close(sysctl_fd);
-	}
-
 	err = bpf_prog_get_fd_by_id(0);
 	CHECK(err >= 0 || errno != ENOENT,
 	      "get-fd-by-notexist-prog-id", "err %d errno %d\n", err, errno);
@@ -896,11 +906,47 @@ static int compare_map_keys(int map1_fd, int map2_fd)
 	return 0;
 }
 
+static int compare_stack_ips(int smap_fd, int amap_fd, int stack_trace_len)
+{
+	__u32 key, next_key, *cur_key_p, *next_key_p;
+	char *val_buf1, *val_buf2;
+	int i, err = 0;
+
+	val_buf1 = malloc(stack_trace_len);
+	val_buf2 = malloc(stack_trace_len);
+	cur_key_p = NULL;
+	next_key_p = &key;
+	while (bpf_map_get_next_key(smap_fd, cur_key_p, next_key_p) == 0) {
+		err = bpf_map_lookup_elem(smap_fd, next_key_p, val_buf1);
+		if (err)
+			goto out;
+		err = bpf_map_lookup_elem(amap_fd, next_key_p, val_buf2);
+		if (err)
+			goto out;
+		for (i = 0; i < stack_trace_len; i++) {
+			if (val_buf1[i] != val_buf2[i]) {
+				err = -1;
+				goto out;
+			}
+		}
+		key = *next_key_p;
+		cur_key_p = &key;
+		next_key_p = &next_key;
+	}
+	if (errno != ENOENT)
+		err = -1;
+
+out:
+	free(val_buf1);
+	free(val_buf2);
+	return err;
+}
+
 static void test_stacktrace_map()
 {
-	int control_map_fd, stackid_hmap_fd, stackmap_fd;
+	int control_map_fd, stackid_hmap_fd, stackmap_fd, stack_amap_fd;
 	const char *file = "./test_stacktrace_map.o";
-	int bytes, efd, err, pmu_fd, prog_fd;
+	int bytes, efd, err, pmu_fd, prog_fd, stack_trace_len;
 	struct perf_event_attr attr = {};
 	__u32 key, val, duration = 0;
 	struct bpf_object *obj;
@@ -956,6 +1002,10 @@ static void test_stacktrace_map()
 	if (stackmap_fd < 0)
 		goto disable_pmu;
 
+	stack_amap_fd = bpf_find_map(__func__, obj, "stack_amap");
+	if (stack_amap_fd < 0)
+		goto disable_pmu;
+
 	/* give some time for bpf program run */
 	sleep(1);
 
@@ -977,6 +1027,12 @@ static void test_stacktrace_map()
977 "err %d errno %d\n", err, errno)) 1027 "err %d errno %d\n", err, errno))
978 goto disable_pmu_noerr; 1028 goto disable_pmu_noerr;
979 1029
1030 stack_trace_len = PERF_MAX_STACK_DEPTH * sizeof(__u64);
1031 err = compare_stack_ips(stackmap_fd, stack_amap_fd, stack_trace_len);
1032 if (CHECK(err, "compare_stack_ips stackmap vs. stack_amap",
1033 "err %d errno %d\n", err, errno))
1034 goto disable_pmu_noerr;
1035
980 goto disable_pmu_noerr; 1036 goto disable_pmu_noerr;
981disable_pmu: 1037disable_pmu:
982 error_cnt++; 1038 error_cnt++;
@@ -1070,9 +1126,9 @@ err:
 
 static void test_stacktrace_build_id(void)
 {
-	int control_map_fd, stackid_hmap_fd, stackmap_fd;
+	int control_map_fd, stackid_hmap_fd, stackmap_fd, stack_amap_fd;
 	const char *file = "./test_stacktrace_build_id.o";
-	int bytes, efd, err, pmu_fd, prog_fd;
+	int bytes, efd, err, pmu_fd, prog_fd, stack_trace_len;
 	struct perf_event_attr attr = {};
 	__u32 key, previous_key, val, duration = 0;
 	struct bpf_object *obj;
1078 struct bpf_object *obj; 1134 struct bpf_object *obj;
@@ -1137,6 +1193,11 @@ static void test_stacktrace_build_id(void)
 		  err, errno))
 		goto disable_pmu;
 
+	stack_amap_fd = bpf_find_map(__func__, obj, "stack_amap");
+	if (CHECK(stack_amap_fd < 0, "bpf_find_map stack_amap",
+		  "err %d errno %d\n", err, errno))
+		goto disable_pmu;
+
 	assert(system("dd if=/dev/urandom of=/dev/zero count=4 2> /dev/null")
 	       == 0);
 	assert(system("./urandom_read") == 0);
@@ -1188,8 +1249,15 @@ static void test_stacktrace_build_id(void)
 		previous_key = key;
 	} while (bpf_map_get_next_key(stackmap_fd, &previous_key, &key) == 0);
 
-	CHECK(build_id_matches < 1, "build id match",
-	      "Didn't find expected build ID from the map\n");
+	if (CHECK(build_id_matches < 1, "build id match",
+		  "Didn't find expected build ID from the map\n"))
+		goto disable_pmu;
+
+	stack_trace_len = PERF_MAX_STACK_DEPTH
+		* sizeof(struct bpf_stack_build_id);
+	err = compare_stack_ips(stackmap_fd, stack_amap_fd, stack_trace_len);
+	CHECK(err, "compare_stack_ips stackmap vs. stack_amap",
+	      "err %d errno %d\n", err, errno);
 
 disable_pmu:
 	ioctl(pmu_fd, PERF_EVENT_IOC_DISABLE);
@@ -1204,8 +1272,147 @@ out:
 	return;
 }
 
+#define MAX_CNT_RAWTP	10ull
+#define MAX_STACK_RAWTP	100
+struct get_stack_trace_t {
+	int pid;
+	int kern_stack_size;
+	int user_stack_size;
+	int user_stack_buildid_size;
+	__u64 kern_stack[MAX_STACK_RAWTP];
+	__u64 user_stack[MAX_STACK_RAWTP];
+	struct bpf_stack_build_id user_stack_buildid[MAX_STACK_RAWTP];
+};
+
+static int get_stack_print_output(void *data, int size)
+{
+	bool good_kern_stack = false, good_user_stack = false;
+	const char *nonjit_func = "___bpf_prog_run";
+	struct get_stack_trace_t *e = data;
+	int i, num_stack;
+	static __u64 cnt;
+	struct ksym *ks;
+
+	cnt++;
+
+	if (size < sizeof(struct get_stack_trace_t)) {
+		__u64 *raw_data = data;
+		bool found = false;
+
+		num_stack = size / sizeof(__u64);
+		/* If jit is enabled, we do not have a good way to
+		 * verify the sanity of the kernel stack. So we
+		 * just assume it is good if the stack is not empty.
+		 * This could be improved in the future.
+		 */
+		if (jit_enabled) {
+			found = num_stack > 0;
+		} else {
+			for (i = 0; i < num_stack; i++) {
+				ks = ksym_search(raw_data[i]);
+				if (strcmp(ks->name, nonjit_func) == 0) {
+					found = true;
+					break;
+				}
+			}
+		}
+		if (found) {
+			good_kern_stack = true;
+			good_user_stack = true;
+		}
+	} else {
+		num_stack = e->kern_stack_size / sizeof(__u64);
+		if (jit_enabled) {
+			good_kern_stack = num_stack > 0;
+		} else {
+			for (i = 0; i < num_stack; i++) {
+				ks = ksym_search(e->kern_stack[i]);
+				if (strcmp(ks->name, nonjit_func) == 0) {
+					good_kern_stack = true;
+					break;
+				}
+			}
+		}
+		if (e->user_stack_size > 0 && e->user_stack_buildid_size > 0)
+			good_user_stack = true;
+	}
+	if (!good_kern_stack || !good_user_stack)
+		return PERF_EVENT_ERROR;
+
+	if (cnt == MAX_CNT_RAWTP)
+		return PERF_EVENT_DONE;
+
+	return PERF_EVENT_CONT;
+}
+
+static void test_get_stack_raw_tp(void)
+{
+	const char *file = "./test_get_stack_rawtp.o";
+	int i, efd, err, prog_fd, pmu_fd, perfmap_fd;
+	struct perf_event_attr attr = {};
+	struct timespec tv = {0, 10};
+	__u32 key = 0, duration = 0;
+	struct bpf_object *obj;
+
+	err = bpf_prog_load(file, BPF_PROG_TYPE_RAW_TRACEPOINT, &obj, &prog_fd);
+	if (CHECK(err, "prog_load raw tp", "err %d errno %d\n", err, errno))
+		return;
+
+	efd = bpf_raw_tracepoint_open("sys_enter", prog_fd);
+	if (CHECK(efd < 0, "raw_tp_open", "err %d errno %d\n", efd, errno))
+		goto close_prog;
+
+	perfmap_fd = bpf_find_map(__func__, obj, "perfmap");
+	if (CHECK(perfmap_fd < 0, "bpf_find_map", "err %d errno %d\n",
+		  perfmap_fd, errno))
+		goto close_prog;
+
+	err = load_kallsyms();
+	if (CHECK(err < 0, "load_kallsyms", "err %d errno %d\n", err, errno))
+		goto close_prog;
+
+	attr.sample_type = PERF_SAMPLE_RAW;
+	attr.type = PERF_TYPE_SOFTWARE;
+	attr.config = PERF_COUNT_SW_BPF_OUTPUT;
+	pmu_fd = syscall(__NR_perf_event_open, &attr, getpid()/*pid*/, -1/*cpu*/,
+			 -1/*group_fd*/, 0);
+	if (CHECK(pmu_fd < 0, "perf_event_open", "err %d errno %d\n", pmu_fd,
+		  errno))
+		goto close_prog;
+
+	err = bpf_map_update_elem(perfmap_fd, &key, &pmu_fd, BPF_ANY);
+	if (CHECK(err < 0, "bpf_map_update_elem", "err %d errno %d\n", err,
+		  errno))
+		goto close_prog;
+
+	err = ioctl(pmu_fd, PERF_EVENT_IOC_ENABLE, 0);
+	if (CHECK(err < 0, "ioctl PERF_EVENT_IOC_ENABLE", "err %d errno %d\n",
+		  err, errno))
+		goto close_prog;
+
+	err = perf_event_mmap(pmu_fd);
+	if (CHECK(err < 0, "perf_event_mmap", "err %d errno %d\n", err, errno))
+		goto close_prog;
+
+	/* trigger some syscall action */
+	for (i = 0; i < MAX_CNT_RAWTP; i++)
+		nanosleep(&tv, NULL);
+
+	err = perf_event_poller(pmu_fd, get_stack_print_output);
+	if (CHECK(err < 0, "perf_event_poller", "err %d errno %d\n", err, errno))
+		goto close_prog;
+
+	goto close_prog_noerr;
+close_prog:
+	error_cnt++;
+close_prog_noerr:
+	bpf_object__close(obj);
+}
+
 int main(void)
 {
+	jit_enabled = is_jit_enabled();
+
 	test_pkt_access();
 	test_xdp();
 	test_xdp_adjust_tail();
@@ -1219,6 +1426,7 @@ int main(void)
1219 test_stacktrace_map(); 1426 test_stacktrace_map();
1220 test_stacktrace_build_id(); 1427 test_stacktrace_build_id();
1221 test_stacktrace_map_raw_tp(); 1428 test_stacktrace_map_raw_tp();
1429 test_get_stack_raw_tp();
1222 1430
1223 printf("Summary: %d PASSED, %d FAILED\n", pass_cnt, error_cnt); 1431 printf("Summary: %d PASSED, %d FAILED\n", pass_cnt, error_cnt);
1224 return error_cnt ? EXIT_FAILURE : EXIT_SUCCESS; 1432 return error_cnt ? EXIT_FAILURE : EXIT_SUCCESS;
diff --git a/tools/testing/selftests/bpf/test_stacktrace_build_id.c b/tools/testing/selftests/bpf/test_stacktrace_build_id.c
index b755bd783ce5..d86c281e957f 100644
--- a/tools/testing/selftests/bpf/test_stacktrace_build_id.c
+++ b/tools/testing/selftests/bpf/test_stacktrace_build_id.c
@@ -19,7 +19,7 @@ struct bpf_map_def SEC("maps") stackid_hmap = {
19 .type = BPF_MAP_TYPE_HASH, 19 .type = BPF_MAP_TYPE_HASH,
20 .key_size = sizeof(__u32), 20 .key_size = sizeof(__u32),
21 .value_size = sizeof(__u32), 21 .value_size = sizeof(__u32),
22 .max_entries = 10000, 22 .max_entries = 16384,
23}; 23};
24 24
25struct bpf_map_def SEC("maps") stackmap = { 25struct bpf_map_def SEC("maps") stackmap = {
@@ -31,6 +31,14 @@ struct bpf_map_def SEC("maps") stackmap = {
31 .map_flags = BPF_F_STACK_BUILD_ID, 31 .map_flags = BPF_F_STACK_BUILD_ID,
32}; 32};
33 33
34struct bpf_map_def SEC("maps") stack_amap = {
35 .type = BPF_MAP_TYPE_ARRAY,
36 .key_size = sizeof(__u32),
37 .value_size = sizeof(struct bpf_stack_build_id)
38 * PERF_MAX_STACK_DEPTH,
39 .max_entries = 128,
40};
41
34/* taken from /sys/kernel/debug/tracing/events/random/urandom_read/format */ 42/* taken from /sys/kernel/debug/tracing/events/random/urandom_read/format */
35struct random_urandom_args { 43struct random_urandom_args {
36 unsigned long long pad; 44 unsigned long long pad;
@@ -42,7 +50,10 @@ struct random_urandom_args {
42SEC("tracepoint/random/urandom_read") 50SEC("tracepoint/random/urandom_read")
43int oncpu(struct random_urandom_args *args) 51int oncpu(struct random_urandom_args *args)
44{ 52{
53 __u32 max_len = sizeof(struct bpf_stack_build_id)
54 * PERF_MAX_STACK_DEPTH;
45 __u32 key = 0, val = 0, *value_p; 55 __u32 key = 0, val = 0, *value_p;
56 void *stack_p;
46 57
47 value_p = bpf_map_lookup_elem(&control_map, &key); 58 value_p = bpf_map_lookup_elem(&control_map, &key);
48 if (value_p && *value_p) 59 if (value_p && *value_p)
@@ -50,8 +61,13 @@ int oncpu(struct random_urandom_args *args)
50 61
51 /* The size of stackmap and stackid_hmap should be the same */ 62 /* The size of stackmap and stackid_hmap should be the same */
52 key = bpf_get_stackid(args, &stackmap, BPF_F_USER_STACK); 63 key = bpf_get_stackid(args, &stackmap, BPF_F_USER_STACK);
53 if ((int)key >= 0) 64 if ((int)key >= 0) {
54 bpf_map_update_elem(&stackid_hmap, &key, &val, 0); 65 bpf_map_update_elem(&stackid_hmap, &key, &val, 0);
66 stack_p = bpf_map_lookup_elem(&stack_amap, &key);
67 if (stack_p)
68 bpf_get_stack(args, stack_p, max_len,
69 BPF_F_USER_STACK | BPF_F_USER_BUILD_ID);
70 }
55 71
56 return 0; 72 return 0;
57} 73}
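On the userspace side, each stack_amap value is an array of struct bpf_stack_build_id records (a status word, a 20-byte build id, and a file offset), per the uapi header this series updates. The sketch below shows how such an entry could be decoded; dump_build_id_stack() is hypothetical, not part of this patch, and the include paths assume the selftests' usual -I setup.

    #include <stdio.h>
    #include <linux/bpf.h>
    #include <linux/perf_event.h>
    #include <bpf/bpf.h>

    #ifndef PERF_MAX_STACK_DEPTH
    #define PERF_MAX_STACK_DEPTH 127
    #endif

    /* Hypothetical: print the valid build-id frames for one stack id. */
    static void dump_build_id_stack(int amap_fd, __u32 stack_id)
    {
            struct bpf_stack_build_id frames[PERF_MAX_STACK_DEPTH];
            int i, j;

            if (bpf_map_lookup_elem(amap_fd, &stack_id, frames) < 0)
                    return;
            for (i = 0; i < PERF_MAX_STACK_DEPTH; i++) {
                    if (frames[i].status != BPF_STACK_BUILD_ID_VALID)
                            continue;
                    printf("frame %d: offset 0x%llx, build id ", i,
                           (unsigned long long)frames[i].offset);
                    for (j = 0; j < BPF_BUILD_ID_SIZE; j++)
                            printf("%02x", frames[i].build_id[j]);
                    printf("\n");
            }
    }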
diff --git a/tools/testing/selftests/bpf/test_stacktrace_map.c b/tools/testing/selftests/bpf/test_stacktrace_map.c
index 76d85c5d08bd..af111af7ca1a 100644
--- a/tools/testing/selftests/bpf/test_stacktrace_map.c
+++ b/tools/testing/selftests/bpf/test_stacktrace_map.c
@@ -19,14 +19,21 @@ struct bpf_map_def SEC("maps") stackid_hmap = {
19 .type = BPF_MAP_TYPE_HASH, 19 .type = BPF_MAP_TYPE_HASH,
20 .key_size = sizeof(__u32), 20 .key_size = sizeof(__u32),
21 .value_size = sizeof(__u32), 21 .value_size = sizeof(__u32),
22 .max_entries = 10000, 22 .max_entries = 16384,
23}; 23};
24 24
25struct bpf_map_def SEC("maps") stackmap = { 25struct bpf_map_def SEC("maps") stackmap = {
26 .type = BPF_MAP_TYPE_STACK_TRACE, 26 .type = BPF_MAP_TYPE_STACK_TRACE,
27 .key_size = sizeof(__u32), 27 .key_size = sizeof(__u32),
28 .value_size = sizeof(__u64) * PERF_MAX_STACK_DEPTH, 28 .value_size = sizeof(__u64) * PERF_MAX_STACK_DEPTH,
29 .max_entries = 10000, 29 .max_entries = 16384,
30};
31
32struct bpf_map_def SEC("maps") stack_amap = {
33 .type = BPF_MAP_TYPE_ARRAY,
34 .key_size = sizeof(__u32),
35 .value_size = sizeof(__u64) * PERF_MAX_STACK_DEPTH,
36 .max_entries = 16384,
30}; 37};
31 38
32/* taken from /sys/kernel/debug/tracing/events/sched/sched_switch/format */ 39/* taken from /sys/kernel/debug/tracing/events/sched/sched_switch/format */
@@ -44,7 +51,9 @@ struct sched_switch_args {
44SEC("tracepoint/sched/sched_switch") 51SEC("tracepoint/sched/sched_switch")
45int oncpu(struct sched_switch_args *ctx) 52int oncpu(struct sched_switch_args *ctx)
46{ 53{
54 __u32 max_len = PERF_MAX_STACK_DEPTH * sizeof(__u64);
47 __u32 key = 0, val = 0, *value_p; 55 __u32 key = 0, val = 0, *value_p;
56 void *stack_p;
48 57
49 value_p = bpf_map_lookup_elem(&control_map, &key); 58 value_p = bpf_map_lookup_elem(&control_map, &key);
50 if (value_p && *value_p) 59 if (value_p && *value_p)
@@ -52,8 +61,12 @@ int oncpu(struct sched_switch_args *ctx)
52 61
53 /* The size of stackmap and stackid_hmap should be the same */ 62 /* The size of stackmap and stackid_hmap should be the same */
54 key = bpf_get_stackid(ctx, &stackmap, 0); 63 key = bpf_get_stackid(ctx, &stackmap, 0);
55 if ((int)key >= 0) 64 if ((int)key >= 0) {
56 bpf_map_update_elem(&stackid_hmap, &key, &val, 0); 65 bpf_map_update_elem(&stackid_hmap, &key, &val, 0);
66 stack_p = bpf_map_lookup_elem(&stack_amap, &key);
67 if (stack_p)
68 bpf_get_stack(ctx, stack_p, max_len, 0);
69 }
57 70
58 return 0; 71 return 0;
59} 72}
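The userspace half of these tests compares map population by walking keys, the same do/while pattern visible in the test_progs.c hunk earlier. Reduced to its essentials it looks like the sketch below, which assumes the seed key 0xffffffff is absent from the map so that the first bpf_map_get_next_key() call returns the first real key.

    #include <bpf/bpf.h>
    #include <linux/types.h>

    /* Count the keys currently present in a map. */
    static int count_keys(int map_fd)
    {
            __u32 key = 0xffffffff, next_key;
            int cnt = 0;

            while (bpf_map_get_next_key(map_fd, &key, &next_key) == 0) {
                    cnt++;
                    key = next_key;
            }
            return cnt;
    }

Equal counts from stackid_hmap and stackmap are what the "size ... should be the same" comment in the BPF program refers to.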
diff --git a/tools/testing/selftests/bpf/test_verifier.c b/tools/testing/selftests/bpf/test_verifier.c
index 165e9ddfa446..275b4570b5b8 100644
--- a/tools/testing/selftests/bpf/test_verifier.c
+++ b/tools/testing/selftests/bpf/test_verifier.c
@@ -47,7 +47,7 @@
47# define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0])) 47# define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))
48#endif 48#endif
49 49
50#define MAX_INSNS 512 50#define MAX_INSNS BPF_MAXINSNS
51#define MAX_FIXUPS 8 51#define MAX_FIXUPS 8
52#define MAX_NR_MAPS 4 52#define MAX_NR_MAPS 4
53#define POINTER_VALUE 0xcafe4all 53#define POINTER_VALUE 0xcafe4all
@@ -77,6 +77,8 @@ struct bpf_test {
77 } result, result_unpriv; 77 } result, result_unpriv;
78 enum bpf_prog_type prog_type; 78 enum bpf_prog_type prog_type;
79 uint8_t flags; 79 uint8_t flags;
80 __u8 data[TEST_DATA_LEN];
81 void (*fill_helper)(struct bpf_test *self);
80}; 82};
81 83
82/* Note we want this to be 64 bit aligned so that the end of our array is 84/* Note we want this to be 64 bit aligned so that the end of our array is
@@ -94,6 +96,62 @@ struct other_val {
94 long long bar; 96 long long bar;
95}; 97};
96 98
99static void bpf_fill_ld_abs_vlan_push_pop(struct bpf_test *self)
100{
101 /* test: ({skb->data[0], vlan_push} x 51 + {skb->data[0], vlan_pop} x 51) x 5 */
102#define PUSH_CNT 51
103 unsigned int len = BPF_MAXINSNS;
104 struct bpf_insn *insn = self->insns;
105 int i = 0, j, k = 0;
106
107 insn[i++] = BPF_MOV64_REG(BPF_REG_6, BPF_REG_1);
108loop:
109 for (j = 0; j < PUSH_CNT; j++) {
110 insn[i++] = BPF_LD_ABS(BPF_B, 0);
111 insn[i] = BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0x34, len - i - 2);
112 i++;
113 insn[i++] = BPF_MOV64_REG(BPF_REG_1, BPF_REG_6);
114 insn[i++] = BPF_MOV64_IMM(BPF_REG_2, 1);
115 insn[i++] = BPF_MOV64_IMM(BPF_REG_3, 2);
116 insn[i++] = BPF_RAW_INSN(BPF_JMP | BPF_CALL, 0, 0, 0,
117 BPF_FUNC_skb_vlan_push),
118 insn[i] = BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, len - i - 2);
119 i++;
120 }
121
122 for (j = 0; j < PUSH_CNT; j++) {
123 insn[i++] = BPF_LD_ABS(BPF_B, 0);
124 insn[i] = BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0x34, len - i - 2);
125 i++;
126 insn[i++] = BPF_MOV64_REG(BPF_REG_1, BPF_REG_6);
127 insn[i++] = BPF_RAW_INSN(BPF_JMP | BPF_CALL, 0, 0, 0,
128 BPF_FUNC_skb_vlan_pop),
129 insn[i] = BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, len - i - 2);
130 i++;
131 }
132 if (++k < 5)
133 goto loop;
134
135 for (; i < len - 1; i++)
136 insn[i] = BPF_ALU32_IMM(BPF_MOV, BPF_REG_0, 0xbef);
137 insn[len - 1] = BPF_EXIT_INSN();
138}
139
140static void bpf_fill_jump_around_ld_abs(struct bpf_test *self)
141{
142 struct bpf_insn *insn = self->insns;
143 unsigned int len = BPF_MAXINSNS;
144 int i = 0;
145
146 insn[i++] = BPF_MOV64_REG(BPF_REG_6, BPF_REG_1);
147 insn[i++] = BPF_LD_ABS(BPF_B, 0);
148 insn[i] = BPF_JMP_IMM(BPF_JEQ, BPF_REG_0, 10, len - i - 2);
149 i++;
150 while (i < len - 1)
151 insn[i++] = BPF_LD_ABS(BPF_B, 1);
152 insn[i] = BPF_EXIT_INSN();
153}
154
97static struct bpf_test tests[] = { 155static struct bpf_test tests[] = {
98 { 156 {
99 "add+sub+mul", 157 "add+sub+mul",
@@ -11680,6 +11738,242 @@ static struct bpf_test tests[] = {
11680 .errstr = "BPF_XADD stores into R2 packet", 11738 .errstr = "BPF_XADD stores into R2 packet",
11681 .prog_type = BPF_PROG_TYPE_XDP, 11739 .prog_type = BPF_PROG_TYPE_XDP,
11682 }, 11740 },
11741 {
11742 "bpf_get_stack return R0 within range",
11743 .insns = {
11744 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
11745 BPF_ST_MEM(BPF_DW, BPF_REG_10, -8, 0),
11746 BPF_MOV64_REG(BPF_REG_2, BPF_REG_10),
11747 BPF_ALU64_IMM(BPF_ADD, BPF_REG_2, -8),
11748 BPF_LD_MAP_FD(BPF_REG_1, 0),
11749 BPF_RAW_INSN(BPF_JMP | BPF_CALL, 0, 0, 0,
11750 BPF_FUNC_map_lookup_elem),
11751 BPF_JMP_IMM(BPF_JEQ, BPF_REG_0, 0, 28),
11752 BPF_MOV64_REG(BPF_REG_7, BPF_REG_0),
11753 BPF_MOV64_IMM(BPF_REG_9, sizeof(struct test_val)),
11754 BPF_MOV64_REG(BPF_REG_1, BPF_REG_6),
11755 BPF_MOV64_REG(BPF_REG_2, BPF_REG_7),
11756 BPF_MOV64_IMM(BPF_REG_3, sizeof(struct test_val)),
11757 BPF_MOV64_IMM(BPF_REG_4, 256),
11758 BPF_EMIT_CALL(BPF_FUNC_get_stack),
11759 BPF_MOV64_IMM(BPF_REG_1, 0),
11760 BPF_MOV64_REG(BPF_REG_8, BPF_REG_0),
11761 BPF_ALU64_IMM(BPF_LSH, BPF_REG_8, 32),
11762 BPF_ALU64_IMM(BPF_ARSH, BPF_REG_8, 32),
11763 BPF_JMP_REG(BPF_JSLT, BPF_REG_1, BPF_REG_8, 16),
11764 BPF_ALU64_REG(BPF_SUB, BPF_REG_9, BPF_REG_8),
11765 BPF_MOV64_REG(BPF_REG_2, BPF_REG_7),
11766 BPF_ALU64_REG(BPF_ADD, BPF_REG_2, BPF_REG_8),
11767 BPF_MOV64_REG(BPF_REG_1, BPF_REG_9),
11768 BPF_ALU64_IMM(BPF_LSH, BPF_REG_1, 32),
11769 BPF_ALU64_IMM(BPF_ARSH, BPF_REG_1, 32),
11770 BPF_MOV64_REG(BPF_REG_3, BPF_REG_2),
11771 BPF_ALU64_REG(BPF_ADD, BPF_REG_3, BPF_REG_1),
11772 BPF_MOV64_REG(BPF_REG_1, BPF_REG_7),
11773 BPF_MOV64_IMM(BPF_REG_5, sizeof(struct test_val)),
11774 BPF_ALU64_REG(BPF_ADD, BPF_REG_1, BPF_REG_5),
11775 BPF_JMP_REG(BPF_JGE, BPF_REG_3, BPF_REG_1, 4),
11776 BPF_MOV64_REG(BPF_REG_1, BPF_REG_6),
11777 BPF_MOV64_REG(BPF_REG_3, BPF_REG_9),
11778 BPF_MOV64_IMM(BPF_REG_4, 0),
11779 BPF_EMIT_CALL(BPF_FUNC_get_stack),
11780 BPF_EXIT_INSN(),
11781 },
11782 .fixup_map2 = { 4 },
11783 .result = ACCEPT,
11784 .prog_type = BPF_PROG_TYPE_TRACEPOINT,
11785 },
11786 {
11787 "ld_abs: invalid op 1",
11788 .insns = {
11789 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
11790 BPF_LD_ABS(BPF_DW, 0),
11791 BPF_EXIT_INSN(),
11792 },
11793 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11794 .result = REJECT,
11795 .errstr = "unknown opcode",
11796 },
11797 {
11798 "ld_abs: invalid op 2",
11799 .insns = {
11800 BPF_MOV32_IMM(BPF_REG_0, 256),
11801 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
11802 BPF_LD_IND(BPF_DW, BPF_REG_0, 0),
11803 BPF_EXIT_INSN(),
11804 },
11805 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11806 .result = REJECT,
11807 .errstr = "unknown opcode",
11808 },
11809 {
11810 "ld_abs: nmap reduced",
11811 .insns = {
11812 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
11813 BPF_LD_ABS(BPF_H, 12),
11814 BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0x806, 28),
11815 BPF_LD_ABS(BPF_H, 12),
11816 BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0x806, 26),
11817 BPF_MOV32_IMM(BPF_REG_0, 18),
11818 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -64),
11819 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_10, -64),
11820 BPF_LD_IND(BPF_W, BPF_REG_7, 14),
11821 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -60),
11822 BPF_MOV32_IMM(BPF_REG_0, 280971478),
11823 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -56),
11824 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_10, -56),
11825 BPF_LDX_MEM(BPF_W, BPF_REG_0, BPF_REG_10, -60),
11826 BPF_ALU32_REG(BPF_SUB, BPF_REG_0, BPF_REG_7),
11827 BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, 15),
11828 BPF_LD_ABS(BPF_H, 12),
11829 BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0x806, 13),
11830 BPF_MOV32_IMM(BPF_REG_0, 22),
11831 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -56),
11832 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_10, -56),
11833 BPF_LD_IND(BPF_H, BPF_REG_7, 14),
11834 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -52),
11835 BPF_MOV32_IMM(BPF_REG_0, 17366),
11836 BPF_STX_MEM(BPF_W, BPF_REG_10, BPF_REG_0, -48),
11837 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_10, -48),
11838 BPF_LDX_MEM(BPF_W, BPF_REG_0, BPF_REG_10, -52),
11839 BPF_ALU32_REG(BPF_SUB, BPF_REG_0, BPF_REG_7),
11840 BPF_JMP_IMM(BPF_JNE, BPF_REG_0, 0, 2),
11841 BPF_MOV32_IMM(BPF_REG_0, 256),
11842 BPF_EXIT_INSN(),
11843 BPF_MOV32_IMM(BPF_REG_0, 0),
11844 BPF_EXIT_INSN(),
11845 },
11846 .data = {
11847 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0x08, 0x06, 0,
11848 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
11849 0x10, 0xbf, 0x48, 0xd6, 0x43, 0xd6,
11850 },
11851 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11852 .result = ACCEPT,
11853 .retval = 256,
11854 },
11855 {
11856 "ld_abs: div + abs, test 1",
11857 .insns = {
11858 BPF_ALU64_REG(BPF_MOV, BPF_REG_6, BPF_REG_1),
11859 BPF_LD_ABS(BPF_B, 3),
11860 BPF_ALU64_IMM(BPF_MOV, BPF_REG_2, 2),
11861 BPF_ALU32_REG(BPF_DIV, BPF_REG_0, BPF_REG_2),
11862 BPF_ALU64_REG(BPF_MOV, BPF_REG_8, BPF_REG_0),
11863 BPF_LD_ABS(BPF_B, 4),
11864 BPF_ALU64_REG(BPF_ADD, BPF_REG_8, BPF_REG_0),
11865 BPF_LD_IND(BPF_B, BPF_REG_8, -70),
11866 BPF_EXIT_INSN(),
11867 },
11868 .data = {
11869 10, 20, 30, 40, 50,
11870 },
11871 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11872 .result = ACCEPT,
11873 .retval = 10,
11874 },
11875 {
11876 "ld_abs: div + abs, test 2",
11877 .insns = {
11878 BPF_ALU64_REG(BPF_MOV, BPF_REG_6, BPF_REG_1),
11879 BPF_LD_ABS(BPF_B, 3),
11880 BPF_ALU64_IMM(BPF_MOV, BPF_REG_2, 2),
11881 BPF_ALU32_REG(BPF_DIV, BPF_REG_0, BPF_REG_2),
11882 BPF_ALU64_REG(BPF_MOV, BPF_REG_8, BPF_REG_0),
11883 BPF_LD_ABS(BPF_B, 128),
11884 BPF_ALU64_REG(BPF_ADD, BPF_REG_8, BPF_REG_0),
11885 BPF_LD_IND(BPF_B, BPF_REG_8, -70),
11886 BPF_EXIT_INSN(),
11887 },
11888 .data = {
11889 10, 20, 30, 40, 50,
11890 },
11891 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11892 .result = ACCEPT,
11893 .retval = 0,
11894 },
11895 {
11896 "ld_abs: div + abs, test 3",
11897 .insns = {
11898 BPF_ALU64_REG(BPF_MOV, BPF_REG_6, BPF_REG_1),
11899 BPF_ALU64_IMM(BPF_MOV, BPF_REG_7, 0),
11900 BPF_LD_ABS(BPF_B, 3),
11901 BPF_ALU32_REG(BPF_DIV, BPF_REG_0, BPF_REG_7),
11902 BPF_EXIT_INSN(),
11903 },
11904 .data = {
11905 10, 20, 30, 40, 50,
11906 },
11907 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11908 .result = ACCEPT,
11909 .retval = 0,
11910 },
11911 {
11912 "ld_abs: div + abs, test 4",
11913 .insns = {
11914 BPF_ALU64_REG(BPF_MOV, BPF_REG_6, BPF_REG_1),
11915 BPF_ALU64_IMM(BPF_MOV, BPF_REG_7, 0),
11916 BPF_LD_ABS(BPF_B, 256),
11917 BPF_ALU32_REG(BPF_DIV, BPF_REG_0, BPF_REG_7),
11918 BPF_EXIT_INSN(),
11919 },
11920 .data = {
11921 10, 20, 30, 40, 50,
11922 },
11923 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11924 .result = ACCEPT,
11925 .retval = 0,
11926 },
11927 {
11928 "ld_abs: vlan + abs, test 1",
11929 .insns = { },
11930 .data = {
11931 0x34,
11932 },
11933 .fill_helper = bpf_fill_ld_abs_vlan_push_pop,
11934 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11935 .result = ACCEPT,
11936 .retval = 0xbef,
11937 },
11938 {
11939 "ld_abs: vlan + abs, test 2",
11940 .insns = {
11941 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
11942 BPF_LD_ABS(BPF_B, 0),
11943 BPF_LD_ABS(BPF_H, 0),
11944 BPF_LD_ABS(BPF_W, 0),
11945 BPF_MOV64_REG(BPF_REG_7, BPF_REG_6),
11946 BPF_MOV64_IMM(BPF_REG_6, 0),
11947 BPF_MOV64_REG(BPF_REG_1, BPF_REG_7),
11948 BPF_MOV64_IMM(BPF_REG_2, 1),
11949 BPF_MOV64_IMM(BPF_REG_3, 2),
11950 BPF_RAW_INSN(BPF_JMP | BPF_CALL, 0, 0, 0,
11951 BPF_FUNC_skb_vlan_push),
11952 BPF_MOV64_REG(BPF_REG_6, BPF_REG_7),
11953 BPF_LD_ABS(BPF_B, 0),
11954 BPF_LD_ABS(BPF_H, 0),
11955 BPF_LD_ABS(BPF_W, 0),
11956 BPF_MOV64_IMM(BPF_REG_0, 42),
11957 BPF_EXIT_INSN(),
11958 },
11959 .data = {
11960 0x34,
11961 },
11962 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11963 .result = ACCEPT,
11964 .retval = 42,
11965 },
11966 {
11967 "ld_abs: jump around ld_abs",
11968 .insns = { },
11969 .data = {
11970 10, 11,
11971 },
11972 .fill_helper = bpf_fill_jump_around_ld_abs,
11973 .prog_type = BPF_PROG_TYPE_SCHED_CLS,
11974 .result = ACCEPT,
11975 .retval = 10,
11976 },
11683}; 11977};
11684 11978
11685static int probe_filter_length(const struct bpf_insn *fp) 11979static int probe_filter_length(const struct bpf_insn *fp)
@@ -11783,7 +12077,7 @@ static int create_map_in_map(void)
11783 return outer_map_fd; 12077 return outer_map_fd;
11784} 12078}
11785 12079
11786static char bpf_vlog[32768]; 12080static char bpf_vlog[UINT_MAX >> 8];
11787 12081
11788static void do_test_fixup(struct bpf_test *test, struct bpf_insn *prog, 12082static void do_test_fixup(struct bpf_test *test, struct bpf_insn *prog,
11789 int *map_fds) 12083 int *map_fds)
@@ -11794,6 +12088,9 @@ static void do_test_fixup(struct bpf_test *test, struct bpf_insn *prog,
11794 int *fixup_prog = test->fixup_prog; 12088 int *fixup_prog = test->fixup_prog;
11795 int *fixup_map_in_map = test->fixup_map_in_map; 12089 int *fixup_map_in_map = test->fixup_map_in_map;
11796 12090
12091 if (test->fill_helper)
12092 test->fill_helper(test);
12093
11797 /* Allocating HTs with 1 elem is fine here, since we only test 12094 /* Allocating HTs with 1 elem is fine here, since we only test
11798 * for verifier and not do a runtime lookup, so the only thing 12095 * for verifier and not do a runtime lookup, so the only thing
11799 * that really matters is value size in this case. 12096 * that really matters is value size in this case.
@@ -11843,10 +12140,8 @@ static void do_test_single(struct bpf_test *test, bool unpriv,
11843 int *passes, int *errors) 12140 int *passes, int *errors)
11844{ 12141{
11845 int fd_prog, expected_ret, reject_from_alignment; 12142 int fd_prog, expected_ret, reject_from_alignment;
12143 int prog_len, prog_type = test->prog_type;
11846 struct bpf_insn *prog = test->insns; 12144 struct bpf_insn *prog = test->insns;
11847 int prog_len = probe_filter_length(prog);
11848 char data_in[TEST_DATA_LEN] = {};
11849 int prog_type = test->prog_type;
11850 int map_fds[MAX_NR_MAPS]; 12145 int map_fds[MAX_NR_MAPS];
11851 const char *expected_err; 12146 const char *expected_err;
11852 uint32_t retval; 12147 uint32_t retval;
@@ -11856,6 +12151,7 @@ static void do_test_single(struct bpf_test *test, bool unpriv,
11856 map_fds[i] = -1; 12151 map_fds[i] = -1;
11857 12152
11858 do_test_fixup(test, prog, map_fds); 12153 do_test_fixup(test, prog, map_fds);
12154 prog_len = probe_filter_length(prog);
11859 12155
11860 fd_prog = bpf_verify_program(prog_type ? : BPF_PROG_TYPE_SOCKET_FILTER, 12156 fd_prog = bpf_verify_program(prog_type ? : BPF_PROG_TYPE_SOCKET_FILTER,
11861 prog, prog_len, test->flags & F_LOAD_WITH_STRICT_ALIGNMENT, 12157 prog, prog_len, test->flags & F_LOAD_WITH_STRICT_ALIGNMENT,
@@ -11895,8 +12191,9 @@ static void do_test_single(struct bpf_test *test, bool unpriv,
11895 } 12191 }
11896 12192
11897 if (fd_prog >= 0) { 12193 if (fd_prog >= 0) {
11898 err = bpf_prog_test_run(fd_prog, 1, data_in, sizeof(data_in), 12194 err = bpf_prog_test_run(fd_prog, 1, test->data,
11899 NULL, NULL, &retval, NULL); 12195 sizeof(test->data), NULL, NULL,
12196 &retval, NULL);
11900 if (err && errno != 524/*ENOTSUPP*/ && errno != EPERM) { 12197 if (err && errno != 524/*ENOTSUPP*/ && errno != EPERM) {
11901 printf("Unexpected bpf_prog_test_run error\n"); 12198 printf("Unexpected bpf_prog_test_run error\n");
11902 goto fail_log; 12199 goto fail_log;
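The new .fill_helper hook is what makes the BPF_MAXINSNS-sized tests above workable: do_test_fixup() invokes it before probe_filter_length(), so a test can synthesize its instruction stream at runtime rather than spelling out thousands of initializers. The sketch below shows the shape of such a generator; bpf_fill_ret_7 is a hypothetical example, not part of this patch.

    /* Pad the program out to BPF_MAXINSNS with cheap moves, then
     * set r0 = 7 and exit. A test would reference it with
     * .insns = { }, .fill_helper = bpf_fill_ret_7, .retval = 7. */
    static void bpf_fill_ret_7(struct bpf_test *self)
    {
            struct bpf_insn *insn = self->insns;
            unsigned int len = BPF_MAXINSNS;
            unsigned int i;

            for (i = 0; i < len - 2; i++)
                    insn[i] = BPF_MOV64_IMM(BPF_REG_0, 0);
            insn[len - 2] = BPF_MOV64_IMM(BPF_REG_0, 7);
            insn[len - 1] = BPF_EXIT_INSN();
    }

Because self->insns is sized MAX_INSNS (now BPF_MAXINSNS), a fill helper may fill the array exactly but must not run past it.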
diff --git a/tools/testing/selftests/bpf/trace_helpers.c b/tools/testing/selftests/bpf/trace_helpers.c
new file mode 100644
index 000000000000..ad025bd75f1c
--- /dev/null
+++ b/tools/testing/selftests/bpf/trace_helpers.c
@@ -0,0 +1,180 @@
1// SPDX-License-Identifier: GPL-2.0
2#include <stdio.h>
3#include <stdlib.h>
4#include <string.h>
5#include <assert.h>
6#include <errno.h>
7#include <poll.h>
8#include <unistd.h>
9#include <linux/perf_event.h>
10#include <sys/mman.h>
11#include "trace_helpers.h"
12
13#define MAX_SYMS 300000
14static struct ksym syms[MAX_SYMS];
15static int sym_cnt;
16
17static int ksym_cmp(const void *p1, const void *p2)
18{
19 return (((struct ksym *)p1)->addr > ((struct ksym *)p2)->addr) - (((struct ksym *)p1)->addr < ((struct ksym *)p2)->addr);
20}
21
22int load_kallsyms(void)
23{
24 FILE *f = fopen("/proc/kallsyms", "r");
25 char func[256], buf[256];
26 char symbol;
27 void *addr;
28 int i = 0;
29
30 if (!f)
31 return -ENOENT;
32
33 while (!feof(f)) {
34 if (!fgets(buf, sizeof(buf), f))
35 break;
36 if (sscanf(buf, "%p %c %s", &addr, &symbol, func) != 3)
37 break;
38 if (!addr)
39 continue;
40 syms[i].addr = (long) addr;
41 syms[i].name = strdup(func);
42 if (++i >= MAX_SYMS) break;
43 }
44 sym_cnt = i;
45 qsort(syms, sym_cnt, sizeof(struct ksym), ksym_cmp);
46 return 0;
47}
48
49struct ksym *ksym_search(long key)
50{
51 int start = 0, end = sym_cnt;
52 int result;
53
54 while (start < end) {
55 size_t mid = start + (end - start) / 2;
56
57 result = key - syms[mid].addr;
58 if (result < 0)
59 end = mid;
60 else if (result > 0)
61 start = mid + 1;
62 else
63 return &syms[mid];
64 }
65
66 if (start >= 1 && syms[start - 1].addr < key &&
67 key < syms[start].addr)
68 /* valid ksym */
69 return &syms[start - 1];
70
71 /* out of range. return _stext */
72 return &syms[0];
73}
74
75static int page_size;
76static int page_cnt = 8;
77static volatile struct perf_event_mmap_page *header;
78
79int perf_event_mmap(int fd)
80{
81 void *base;
82 int mmap_size;
83
84 page_size = getpagesize();
85 mmap_size = page_size * (page_cnt + 1);
86
87 base = mmap(NULL, mmap_size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0);
88 if (base == MAP_FAILED) {
89 printf("mmap err\n");
90 return -1;
91 }
92
93 header = base;
94 return 0;
95}
96
97static int perf_event_poll(int fd)
98{
99 struct pollfd pfd = { .fd = fd, .events = POLLIN };
100
101 return poll(&pfd, 1, 1000);
102}
103
104struct perf_event_sample {
105 struct perf_event_header header;
106 __u32 size;
107 char data[];
108};
109
110static int perf_event_read(perf_event_print_fn fn)
111{
112 __u64 data_tail = header->data_tail;
113 __u64 data_head = header->data_head;
114 __u64 buffer_size = page_cnt * page_size;
115 void *base, *begin, *end;
116 static char buf[65536]; /* must hold one whole wrapped record */
117 int ret;
118
119 asm volatile("" ::: "memory"); /* in real code it should be smp_rmb() */
120 if (data_head == data_tail)
121 return PERF_EVENT_CONT;
122
123 base = ((char *)header) + page_size;
124
125 begin = base + data_tail % buffer_size;
126 end = base + data_head % buffer_size;
127
128 while (begin != end) {
129 struct perf_event_sample *e;
130
131 e = begin;
132 if (begin + e->header.size > base + buffer_size) {
133 long len = base + buffer_size - begin;
134
135 assert(len < e->header.size);
136 memcpy(buf, begin, len);
137 memcpy(buf + len, base, e->header.size - len);
138 e = (void *) buf;
139 begin = base + e->header.size - len;
140 } else if (begin + e->header.size == base + buffer_size) {
141 begin = base;
142 } else {
143 begin += e->header.size;
144 }
145
146 if (e->header.type == PERF_RECORD_SAMPLE) {
147 ret = fn(e->data, e->size);
148 if (ret != PERF_EVENT_CONT)
149 return ret;
150 } else if (e->header.type == PERF_RECORD_LOST) {
151 struct {
152 struct perf_event_header header;
153 __u64 id;
154 __u64 lost;
155 } *lost = (void *) e;
156 printf("lost %lld events\n", lost->lost);
157 } else {
158 printf("unknown event type=%d size=%d\n",
159 e->header.type, e->header.size);
160 }
161 }
162
163 __sync_synchronize(); /* smp_mb() */
164 header->data_tail = data_head;
165 return PERF_EVENT_CONT;
166}
167
168int perf_event_poller(int fd, perf_event_print_fn output_fn)
169{
170 int ret;
171
172 for (;;) {
173 perf_event_poll(fd);
174 ret = perf_event_read(output_fn);
175 if (ret != PERF_EVENT_CONT)
176 return ret;
177 }
178
179 return PERF_EVENT_DONE;
180}
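Taken together, load_kallsyms() and ksym_search() give the tests a self-contained kernel symbolizer. A minimal standalone use is sketched below; the lookup address is arbitrary, and /proc/kallsyms shows zeroed addresses without sufficient privileges, so this needs to run as root.

    #include <stdio.h>
    #include "trace_helpers.h"

    int main(void)
    {
            struct ksym *ks;

            if (load_kallsyms())
                    return 1;
            /* Any address between two symbols resolves to the lower
             * one; out-of-range addresses fall back to the first
             * entry (_stext). */
            ks = ksym_search(0xffffffff81000000UL);
            printf("0x%lx -> %s\n", ks->addr, ks->name);
            return 0;
    }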
diff --git a/tools/testing/selftests/bpf/trace_helpers.h b/tools/testing/selftests/bpf/trace_helpers.h
new file mode 100644
index 000000000000..fe3eefd21e86
--- /dev/null
+++ b/tools/testing/selftests/bpf/trace_helpers.h
@@ -0,0 +1,23 @@
1/* SPDX-License-Identifier: GPL-2.0 */
2#ifndef __TRACE_HELPER_H
3#define __TRACE_HELPER_H
4
5struct ksym {
6 long addr;
7 char *name;
8};
9
10int load_kallsyms(void);
11struct ksym *ksym_search(long key);
12
13typedef int (*perf_event_print_fn)(void *data, int size);
14
15/* return code for perf_event_print_fn */
16#define PERF_EVENT_DONE 0
17#define PERF_EVENT_ERROR -1
18#define PERF_EVENT_CONT -2
19
20int perf_event_mmap(int fd);
21/* return PERF_EVENT_DONE or PERF_EVENT_ERROR */
22int perf_event_poller(int fd, perf_event_print_fn output_fn);
23#endif