git.ipfire.org Git - thirdparty/linux.git/commitdiff
perf thread: Add optional e_flags output argument to thread__e_machine
author Ian Rogers <irogers@google.com>
Fri, 23 Jan 2026 22:22:07 +0000 (14:22 -0800)
committer Arnaldo Carvalho de Melo <acme@redhat.com>
Mon, 26 Jan 2026 21:21:20 +0000 (18:21 -0300)
The e_flags are needed to accurately compute complete perf register
information for CSKY.

Add the ability to read and have this value associated with a thread.

This change doesn't wire up the use of the e_flags except in disasm
where use already exists but just wasn't set up yet.

Signed-off-by: Ian Rogers <irogers@google.com>
Cc: Aditya Bodkhe <aditya.b1@linux.ibm.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Athira Rajeev <atrajeev@linux.ibm.com>
Cc: Chun-Tse Shao <ctshao@google.com>
Cc: Guo Ren <guoren@kernel.org>
Cc: Howard Chu <howardchu95@gmail.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: James Clark <james.clark@linaro.org>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Sergei Trofimovich <slyich@gmail.com>
Cc: Shimin Guo <shimin.guo@skydio.com>
Cc: Stephen Brennan <stephen.s.brennan@oracle.com>
Cc: Swapnil Sapkal <swapnil.sapkal@amd.com>
Cc: Tianyou Li <tianyou.li@intel.com>
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
12 files changed:
tools/perf/builtin-script.c
tools/perf/builtin-trace.c
tools/perf/util/annotate.c
tools/perf/util/disasm.c
tools/perf/util/disasm.h
tools/perf/util/dso.c
tools/perf/util/dso.h
tools/perf/util/scripting-engines/trace-event-python.c
tools/perf/util/session.c
tools/perf/util/thread.c
tools/perf/util/thread.h
tools/perf/util/unwind-libdw.c

index 372bede3023096003232088639de139b8754f35c..8c0de27a9713b62962843b3a6eb0cb288399c361 100644 (file)
@@ -2504,11 +2504,17 @@ static void process_event(struct perf_script *script,
                                    symbol_conf.bt_stop_list, fp);
        }
 
-       if (PRINT_FIELD(IREGS))
-               perf_sample__fprintf_iregs(sample, attr, thread__e_machine(thread, machine), fp);
+       if (PRINT_FIELD(IREGS)) {
+               perf_sample__fprintf_iregs(sample, attr,
+                                          thread__e_machine(thread, machine, /*e_flags=*/NULL),
+                                          fp);
+       }
 
-       if (PRINT_FIELD(UREGS))
-               perf_sample__fprintf_uregs(sample, attr, thread__e_machine(thread, machine), fp);
+       if (PRINT_FIELD(UREGS)) {
+               perf_sample__fprintf_uregs(sample, attr,
+                                          thread__e_machine(thread, machine, /*e_flags=*/NULL),
+                                          fp);
+       }
 
        if (PRINT_FIELD(BRSTACK))
                perf_sample__fprintf_brstack(sample, thread, evsel, fp);
index 8df5ca44e4f9152957a3254c7d7f659287147fdd..311d9da9896a41c42574ba8fff9223a3ab01dded 100644 (file)
@@ -2789,7 +2789,7 @@ static int trace__sys_enter(struct trace *trace, struct evsel *evsel,
        struct thread_trace *ttrace;
 
        thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
-       e_machine = thread__e_machine(thread, trace->host);
+       e_machine = thread__e_machine(thread, trace->host, /*e_flags=*/NULL);
        sc = trace__syscall_info(trace, evsel, e_machine, id);
        if (sc == NULL)
                goto out_put;
@@ -2868,7 +2868,7 @@ static int trace__fprintf_sys_enter(struct trace *trace, struct evsel *evsel,
 
 
        thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
-       e_machine = thread__e_machine(thread, trace->host);
+       e_machine = thread__e_machine(thread, trace->host, /*e_flags=*/NULL);
        sc = trace__syscall_info(trace, evsel, e_machine, id);
        if (sc == NULL)
                goto out_put;
@@ -2934,7 +2934,7 @@ static int trace__sys_exit(struct trace *trace, struct evsel *evsel,
        struct thread_trace *ttrace;
 
        thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
-       e_machine = thread__e_machine(thread, trace->host);
+       e_machine = thread__e_machine(thread, trace->host, /*e_flags=*/NULL);
        sc = trace__syscall_info(trace, evsel, e_machine, id);
        if (sc == NULL)
                goto out_put;
@@ -3285,7 +3285,9 @@ static int trace__event_handler(struct trace *trace, struct evsel *evsel,
 
        if (evsel == trace->syscalls.events.bpf_output) {
                int id = perf_evsel__sc_tp_uint(evsel, id, sample);
-               int e_machine = thread ? thread__e_machine(thread, trace->host) : EM_HOST;
+               int e_machine = thread
+                       ? thread__e_machine(thread, trace->host, /*e_flags=*/NULL)
+                       : EM_HOST;
                struct syscall *sc = trace__syscall_info(trace, evsel, e_machine, id);
 
                if (sc) {
@@ -4916,7 +4918,7 @@ static size_t trace__fprintf_thread(FILE *fp, struct thread *thread, struct trac
 {
        size_t printed = 0;
        struct thread_trace *ttrace = thread__priv(thread);
-       int e_machine = thread__e_machine(thread, trace->host);
+       int e_machine = thread__e_machine(thread, trace->host, /*e_flags=*/NULL);
        double ratio;
 
        if (ttrace == NULL)
index c16c6dfaa959675e0fa0e248ad7376cfbd934850..880b1bd300c21e678673aa82cef3fa7f9263b5f9 100644 (file)
@@ -984,6 +984,7 @@ int thread__get_arch(struct thread *thread, const struct arch **parch)
 {
        const struct arch *arch;
        struct machine *machine;
+       uint32_t e_flags;
        uint16_t e_machine;
 
        if (!thread) {
@@ -992,8 +993,8 @@ int thread__get_arch(struct thread *thread, const struct arch **parch)
        }
 
        machine = maps__machine(thread__maps(thread));
-       e_machine = thread__e_machine(thread, machine);
-       arch = arch__find(e_machine, machine->env ? machine->env->cpuid : NULL);
+       e_machine = thread__e_machine(thread, machine, &e_flags);
+       arch = arch__find(e_machine, e_flags, machine->env ? machine->env->cpuid : NULL);
        if (arch == NULL) {
                pr_err("%s: unsupported arch %d\n", __func__, e_machine);
                return errno;
index 9b0ba1fc5aecd0fdd47986a8cbef46f1602524dc..6b36287f30feec6f3d0641740e8d0f1fe50e1465 100644 (file)
@@ -134,7 +134,7 @@ static int arch__cmp(const void *a, const void *b)
        return e_machine_and_eflags__cmp(&(*aa)->id, &(*ab)->id);
 }
 
-const struct arch *arch__find(uint16_t e_machine, const char *cpuid)
+const struct arch *arch__find(uint16_t e_machine, uint32_t e_flags, const char *cpuid)
 {
        static const struct arch *(*const arch_new_fn[])(const struct e_machine_and_e_flags *id,
                                                         const char *cpuid) = {
@@ -157,8 +157,7 @@ const struct arch *arch__find(uint16_t e_machine, const char *cpuid)
        static size_t num_archs;
        struct e_machine_and_e_flags key = {
                .e_machine = e_machine,
-               // TODO: e_flags should really come from the same source as e_machine.
-               .e_flags = EF_HOST,
+               .e_flags = e_flags,
        };
        const struct arch *result = NULL, **tmp;
 
index 6a1905f9d4fc9c47a912d9a1efa2acc2b0c3493c..a6e478caf61a95857e86e1154dbef6d2a2078447 100644 (file)
@@ -108,7 +108,7 @@ struct annotate_args {
        char                      *fileloc;
 };
 
-const struct arch *arch__find(uint16_t e_machine, const char *cpuid);
+const struct arch *arch__find(uint16_t e_machine, uint32_t e_flags, const char *cpuid);
 bool arch__is_x86(const struct arch *arch);
 bool arch__is_powerpc(const struct arch *arch);
 
index 91c9f7cb9d8ce8afdcf94efe76d4672e878f9477..b791e1b6b2cf01f47d23d468b44e154fca841ced 100644 (file)
@@ -1220,14 +1220,20 @@ static enum dso_swap_type dso_swap_type__from_elf_data(unsigned char eidata)
 }
 
 /* Reads e_machine from fd, optionally caching data in dso. */
-uint16_t dso__read_e_machine(struct dso *optional_dso, int fd)
+uint16_t dso__read_e_machine(struct dso *optional_dso, int fd, uint32_t *e_flags)
 {
        uint16_t e_machine = EM_NONE;
        unsigned char e_ident[EI_NIDENT];
        enum dso_swap_type swap_type;
+       bool need_e_flags;
 
-       _Static_assert(offsetof(Elf32_Ehdr, e_ident) == 0, "Unexpected offset");
-       _Static_assert(offsetof(Elf64_Ehdr, e_ident) == 0, "Unexpected offset");
+       if (e_flags)
+               *e_flags = 0;
+
+       {
+               _Static_assert(offsetof(Elf32_Ehdr, e_ident) == 0, "Unexpected offset");
+               _Static_assert(offsetof(Elf64_Ehdr, e_ident) == 0, "Unexpected offset");
+       }
        if (pread(fd, &e_ident, sizeof(e_ident), 0) != sizeof(e_ident))
                return EM_NONE; // Read failed.
 
@@ -1254,18 +1260,35 @@ uint16_t dso__read_e_machine(struct dso *optional_dso, int fd)
        {
                _Static_assert(offsetof(Elf32_Ehdr, e_machine) == 18, "Unexpected offset");
                _Static_assert(offsetof(Elf64_Ehdr, e_machine) == 18, "Unexpected offset");
-               if (pread(fd, &e_machine, sizeof(e_machine), 18) != sizeof(e_machine))
-                       return EM_NONE; // e_machine read failed.
        }
+       if (pread(fd, &e_machine, sizeof(e_machine), 18) != sizeof(e_machine))
+               return EM_NONE; // e_machine read failed.
 
        e_machine = DSO_SWAP_TYPE__SWAP(swap_type, uint16_t, e_machine);
        if (e_machine >= EM_NUM)
                return EM_NONE; // Bad ELF machine number.
 
+#ifdef NDEBUG
+       /* In production code the e_flags are only needed on CSKY. */
+       need_e_flags = e_flags && e_machine == EM_CSKY;
+#else
+       /* Debug code will always read the e_flags. */
+       need_e_flags = e_flags != NULL;
+#endif
+       if (need_e_flags) {
+               off_t offset = e_ident[EI_CLASS] == ELFCLASS32
+                       ? offsetof(Elf32_Ehdr, e_flags) : offsetof(Elf64_Ehdr, e_flags);
+
+               if (pread(fd, e_flags, sizeof(*e_flags), offset) != sizeof(*e_flags)) {
+                       *e_flags = 0;
+                       return EM_NONE; // e_flags read failed.
+               }
+               *e_flags = DSO_SWAP_TYPE__SWAP(swap_type, uint32_t, *e_flags); // As for e_machine.
+       }
        return e_machine;
 }
 
-uint16_t dso__e_machine(struct dso *dso, struct machine *machine)
+uint16_t dso__e_machine(struct dso *dso, struct machine *machine, uint32_t *e_flags)
 {
        uint16_t e_machine = EM_NONE;
        int fd;
@@ -1285,6 +1308,8 @@ uint16_t dso__e_machine(struct dso *dso, struct machine *machine)
        case DSO_BINARY_TYPE__BPF_IMAGE:
        case DSO_BINARY_TYPE__OOL:
        case DSO_BINARY_TYPE__JAVA_JIT:
+               if (e_flags)
+                       *e_flags = EF_HOST;
                return EM_HOST;
        case DSO_BINARY_TYPE__DEBUGLINK:
        case DSO_BINARY_TYPE__BUILD_ID_CACHE:
@@ -1299,6 +1324,8 @@ uint16_t dso__e_machine(struct dso *dso, struct machine *machine)
                break;
        case DSO_BINARY_TYPE__NOT_FOUND:
        default:
+               if (e_flags)
+                       *e_flags = 0;
                return EM_NONE;
        }
 
@@ -1311,7 +1338,9 @@ uint16_t dso__e_machine(struct dso *dso, struct machine *machine)
        try_to_open_dso(dso, machine);
        fd = dso__data(dso)->fd;
        if (fd >= 0)
-               e_machine = dso__read_e_machine(dso, fd);
+               e_machine = dso__read_e_machine(dso, fd, e_flags);
+       else if (e_flags)
+               *e_flags = 0;
 
        mutex_unlock(dso__data_open_lock());
        return e_machine;
index a95fee7d634b3105cff57aed76af254d1c7dbb42..ede691e9a24959d9baff589defc9a73e1a33cde0 100644 (file)
@@ -866,8 +866,8 @@ int dso__data_file_size(struct dso *dso, struct machine *machine);
 off_t dso__data_size(struct dso *dso, struct machine *machine);
 ssize_t dso__data_read_offset(struct dso *dso, struct machine *machine,
                              u64 offset, u8 *data, ssize_t size);
-uint16_t dso__read_e_machine(struct dso *optional_dso, int fd);
-uint16_t dso__e_machine(struct dso *dso, struct machine *machine);
+uint16_t dso__read_e_machine(struct dso *optional_dso, int fd, uint32_t *e_flags);
+uint16_t dso__e_machine(struct dso *dso, struct machine *machine, uint32_t *e_flags);
 ssize_t dso__data_read_addr(struct dso *dso, struct map *map,
                            struct machine *machine, u64 addr,
                            u8 *data, ssize_t size);
index b90edc147796531ccdde33f535c6ddf4c636adef..50f0d16520cca6cad297c9f4299f57d5a0263040 100644 (file)
@@ -925,7 +925,7 @@ static PyObject *get_perf_sample_dict(struct perf_sample *sample,
 
        if (al->thread) {
                machine = maps__machine(thread__maps(al->thread));
-               e_machine = thread__e_machine(al->thread, machine);
+               e_machine = thread__e_machine(al->thread, machine, /*e_flags=*/NULL);
        }
        if (set_regs_in_dict(dict, sample, evsel, e_machine))
                Py_FatalError("Failed to setting regs in dict");
index c0231bc000e74697da01dafdc6d4bbdf9ee8eb6c..0e8a128d7c04650e240f86306a039ccd4b500f0f 100644 (file)
@@ -1124,7 +1124,7 @@ static void dump_sample(struct machine *machine, struct evsel *evsel, union perf
        if (sample_type & (PERF_SAMPLE_REGS_USER | PERF_SAMPLE_REGS_INTR)) {
                struct thread *thread = machine__find_thread(machine, sample->pid, sample->pid);
 
-               e_machine = thread__e_machine(thread, machine);
+               e_machine = thread__e_machine(thread, machine, /*e_flags=*/NULL);
        }
 
        printf("(IP, 0x%x): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n",
@@ -2965,7 +2965,7 @@ static int perf_session__e_machine_cb(struct thread *thread,
        uint16_t *result = arg;
        struct machine *machine = maps__machine(thread__maps(thread));
 
-       *result = thread__e_machine(thread, machine);
+       *result = thread__e_machine(thread, machine, /*e_flags=*/NULL);
        return *result != EM_NONE ? 1 : 0;
 }
 
index 3642858e6cbc33e2ac80f3a7f0e157b116f5edf2..618f29afb160c35d465dfdc1700b1add6ead46e0 100644 (file)
@@ -449,7 +449,7 @@ void thread__find_cpumode_addr_location(struct thread *thread, u64 addr,
        }
 }
 
-static uint16_t read_proc_e_machine_for_pid(pid_t pid)
+static uint16_t read_proc_e_machine_for_pid(pid_t pid, uint32_t *e_flags)
 {
        char path[6 /* "/proc/" */ + 11 /* max length of pid */ + 5 /* "/exe\0" */];
        int fd;
@@ -458,30 +458,46 @@ static uint16_t read_proc_e_machine_for_pid(pid_t pid)
        snprintf(path, sizeof(path), "/proc/%d/exe", pid);
        fd = open(path, O_RDONLY);
        if (fd >= 0) {
-               e_machine = dso__read_e_machine(/*optional_dso=*/NULL, fd);
+               e_machine = dso__read_e_machine(/*optional_dso=*/NULL, fd, e_flags);
                close(fd);
        }
        return e_machine;
 }
 
-static int thread__e_machine_callback(struct map *map, void *machine)
+struct thread__e_machine_callback_args {
+       struct machine *machine;
+       uint32_t e_flags;
+       uint16_t e_machine;
+};
+
+static int thread__e_machine_callback(struct map *map, void *_args)
 {
+       struct thread__e_machine_callback_args *args = _args;
        struct dso *dso = map__dso(map);
 
-       _Static_assert(0 == EM_NONE, "Unexpected EM_NONE");
        if (!dso)
-               return EM_NONE;
+               return 0; // No dso, continue search.
 
-       return dso__e_machine(dso, machine);
+       args->e_machine = dso__e_machine(dso, args->machine, &args->e_flags);
+       return args->e_machine != EM_NONE ? 1 /* stop search */ : 0 /* continue search */;
 }
 
-uint16_t thread__e_machine(struct thread *thread, struct machine *machine)
+uint16_t thread__e_machine(struct thread *thread, struct machine *machine, uint32_t *e_flags)
 {
        pid_t tid, pid;
        uint16_t e_machine = RC_CHK_ACCESS(thread)->e_machine;
+       uint32_t local_e_flags = 0;
+       struct thread__e_machine_callback_args args = {
+               .machine = machine,
+               .e_flags = 0,
+               .e_machine = EM_NONE,
+       };
 
-       if (e_machine != EM_NONE)
+       if (e_machine != EM_NONE) {
+               if (e_flags)
+                       *e_flags = thread__e_flags(thread);
                return e_machine;
+       }
 
        tid = thread__tid(thread);
        pid = thread__pid(thread);
@@ -489,18 +505,19 @@ uint16_t thread__e_machine(struct thread *thread, struct machine *machine)
                struct thread *parent = machine__findnew_thread(machine, pid, pid);
 
                if (parent) {
-                       e_machine = thread__e_machine(parent, machine);
+                       e_machine = thread__e_machine(parent, machine, &local_e_flags);
                        thread__put(parent);
-                       thread__set_e_machine(thread, e_machine);
-                       return e_machine;
+                       goto out;
                }
                /* Something went wrong, fallback. */
        }
        /* Reading on the PID thread. First try to find from the maps. */
-       e_machine = maps__for_each_map(thread__maps(thread),
-                                      thread__e_machine_callback,
-                                      machine);
-       if (e_machine == EM_NONE) {
+       maps__for_each_map(thread__maps(thread), thread__e_machine_callback, &args);
+
+       if (args.e_machine != EM_NONE) {
+               e_machine = args.e_machine;
+               local_e_flags = args.e_flags;
+       } else {
                /* Maps failed, perhaps we're live with map events disabled. */
                bool is_live = machine->machines == NULL;
 
@@ -514,12 +531,18 @@ uint16_t thread__e_machine(struct thread *thread, struct machine *machine)
                }
                /* Read from /proc/pid/exe if live. */
                if (is_live)
-                       e_machine = read_proc_e_machine_for_pid(pid);
+                       e_machine = read_proc_e_machine_for_pid(pid, &local_e_flags);
        }
-       if (e_machine != EM_NONE)
+out:
+       if (e_machine != EM_NONE) {
                thread__set_e_machine(thread, e_machine);
-       else
+               thread__set_e_flags(thread, local_e_flags);
+       } else {
                e_machine = EM_HOST;
+               local_e_flags = EF_HOST;
+       }
+       if (e_flags)
+               *e_flags = local_e_flags;
        return e_machine;
 }
 
index 310eaea344bbc8b8cb8302677986ebe22d8f8ede..f5792d3e8a16f1ce21477df8924361b832616319 100644 (file)
@@ -60,6 +60,10 @@ DECLARE_RC_STRUCT(thread) {
        struct srccode_state    srccode_state;
        bool                    filter;
        int                     filter_entry_depth;
+       /**
+        * @e_flags: The ELF EF_* associated with the thread. Valid if e_machine != EM_NONE.
+        */
+       uint32_t                e_flags;
        /**
         * @e_machine: The ELF EM_* associated with the thread. EM_NONE if not
         * computed.
@@ -307,13 +311,23 @@ static inline void thread__set_filter_entry_depth(struct thread *thread, int dep
        RC_CHK_ACCESS(thread)->filter_entry_depth = depth;
 }
 
-uint16_t thread__e_machine(struct thread *thread, struct machine *machine);
+uint16_t thread__e_machine(struct thread *thread, struct machine *machine, uint32_t *e_flags);
 
 static inline void thread__set_e_machine(struct thread *thread, uint16_t e_machine)
 {
        RC_CHK_ACCESS(thread)->e_machine = e_machine;
 }
 
+static inline uint32_t thread__e_flags(const struct thread *thread)
+{
+       return RC_CHK_ACCESS(thread)->e_flags;
+}
+
+static inline void thread__set_e_flags(struct thread *thread, uint32_t e_flags)
+{
+       RC_CHK_ACCESS(thread)->e_flags = e_flags;
+}
+
 
 static inline bool thread__lbr_stitch_enable(const struct thread *thread)
 {
index 9cb0960ef9050059e2e150c1d4cb293d3447d639..3fdcfa06bf228b734dbec5895e6f7d95223e2e78 100644 (file)
@@ -213,7 +213,7 @@ static bool memory_read(Dwfl *dwfl __maybe_unused, Dwarf_Addr addr, Dwarf_Word *
 {
        struct dwfl_ui_thread_info *dwfl_ui_ti = arg;
        struct unwind_info *ui = dwfl_ui_ti->ui;
-       uint16_t e_machine = thread__e_machine(ui->thread, ui->machine);
+       uint16_t e_machine = thread__e_machine(ui->thread, ui->machine, /*e_flags=*/NULL);
        struct stack_dump *stack = &ui->sample->user_stack;
        u64 start, end;
        int offset;
@@ -348,7 +348,7 @@ int unwind__get_entries(unwind_entry_cb_t cb, void *arg,
 {
        struct maps *maps = thread__maps(thread);
        struct machine *machine = maps__machine(maps);
-       uint16_t e_machine = thread__e_machine(thread, machine);
+       uint16_t e_machine = thread__e_machine(thread, machine, /*e_flags=*/NULL);
        struct dwfl_ui_thread_info *dwfl_ui_ti;
        static struct unwind_info *ui;
        Dwfl *dwfl;