perf intel-pt: Add support for emulated ptwrite
authorAdrian Hunter <adrian.hunter@intel.com>
Mon, 9 May 2022 15:23:58 +0000 (18:23 +0300)
committerArnaldo Carvalho de Melo <acme@redhat.com>
Tue, 17 May 2022 14:55:49 +0000 (11:55 -0300)
ptwrite is an Intel x86 instruction that writes arbitrary values into an
Intel PT trace. It is not supported on all hardware, so provide an
alternative that makes use of TNT packets to convey the payload data.
TNT packets encode Taken/Not-taken conditional branch information, so
taking branches based on the payload value will encode the value into
the TNT packet. Refer to the changes to the documentation file
perf-intel-pt.txt in this patch for an example.

Signed-off-by: Adrian Hunter <adrian.hunter@intel.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Link: https://lore.kernel.org/r/20220509152400.376613-2-adrian.hunter@intel.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
tools/perf/Documentation/perf-intel-pt.txt
tools/perf/util/intel-pt-decoder/intel-pt-decoder.c
tools/perf/util/intel-pt-decoder/intel-pt-decoder.h
tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.c
tools/perf/util/intel-pt-decoder/intel-pt-insn-decoder.h
tools/perf/util/intel-pt.c

index 92532d0..8acd704 100644 (file)
@@ -468,6 +468,8 @@ ptw         Enable PTWRITE packets which are produced when a ptwrite instruction
                which contains "1" if the feature is supported and
                "0" otherwise.
 
+               As an alternative, refer to "Emulated PTWRITE" further below.
+
 fup_on_ptw     Enable a FUP packet to follow the PTWRITE packet.  The FUP packet
                provides the address of the ptwrite instruction.  In the absence of
                fup_on_ptw, the decoder will use the address of the previous branch
@@ -1471,6 +1473,92 @@ In that case the --itrace q option is forced because walking executable code
 to reconstruct the control flow is not possible.
 
 
+Emulated PTWRITE
+----------------
+
+Later perf tools support a method to emulate the ptwrite instruction, which
+can be useful if hardware does not support the ptwrite instruction.
+
+Instead of using the ptwrite instruction, a function is used which produces
+a trace that encodes the payload data into TNT packets.  Here is an example
+of the function:
+
+ #include <stdint.h>
+
+ void perf_emulate_ptwrite(uint64_t x)
+ __attribute__((externally_visible, noipa, no_instrument_function, naked));
+
+ #define PERF_EMULATE_PTWRITE_8_BITS \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"        \
+                 "1: shl %rax\n"     \
+                 "   jc 1f\n"
+
+ /* Undefined instruction */
+ #define PERF_EMULATE_PTWRITE_UD2        ".byte 0x0f, 0x0b\n"
+
+ #define PERF_EMULATE_PTWRITE_MAGIC        PERF_EMULATE_PTWRITE_UD2 ".ascii \"perf,ptwrite  \"\n"
+
+ void perf_emulate_ptwrite(uint64_t x __attribute__ ((__unused__)))
+ {
+          /* Assumes SysV ABI : x passed in rdi */
+         __asm__ volatile (
+                 "jmp 1f\n"
+                 PERF_EMULATE_PTWRITE_MAGIC
+                 "1: mov %rdi, %rax\n"
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 PERF_EMULATE_PTWRITE_8_BITS
+                 "1: ret\n"
+         );
+ }
+
+For example, a test program with the function above:
+
+ #include <stdio.h>
+ #include <stdint.h>
+ #include <stdlib.h>
+
+ #include "perf_emulate_ptwrite.h"
+
+ int main(int argc, char *argv[])
+ {
+         uint64_t x = 0;
+
+         if (argc > 1)
+                 x = strtoull(argv[1], NULL, 0);
+         perf_emulate_ptwrite(x);
+         return 0;
+ }
+
+Can be compiled and traced:
+
+ $ gcc -Wall -Wextra -O3 -g -o eg_ptw eg_ptw.c
+ $ perf record -e intel_pt//u ./eg_ptw 0x1234567890abcdef
+ [ perf record: Woken up 1 times to write data ]
+ [ perf record: Captured and wrote 0.017 MB perf.data ]
+ $ perf script --itrace=ew
+           eg_ptw 19875 [007]  8061.235912:     ptwrite:  IP: 0 payload: 0x1234567890abcdef      55701249a196 perf_emulate_ptwrite+0x16 (/home/user/eg_ptw)
+ $
+
+
 EXAMPLE
 -------
 
index e1d8f75..0ac860c 100644 (file)
@@ -137,6 +137,7 @@ struct intel_pt_decoder {
        bool in_psb;
        bool hop;
        bool leap;
+       bool emulated_ptwrite;
        bool vm_time_correlation;
        bool vm_tm_corr_dry_run;
        bool vm_tm_corr_reliable;
@@ -481,6 +482,8 @@ static int intel_pt_ext_err(int code)
                return INTEL_PT_ERR_LOST;
        case -ELOOP:
                return INTEL_PT_ERR_NELOOP;
+       case -ECONNRESET:
+               return INTEL_PT_ERR_EPTW;
        default:
                return INTEL_PT_ERR_UNK;
        }
@@ -497,6 +500,7 @@ static const char *intel_pt_err_msgs[] = {
        [INTEL_PT_ERR_LOST]   = "Lost trace data",
        [INTEL_PT_ERR_UNK]    = "Unknown error!",
        [INTEL_PT_ERR_NELOOP] = "Never-ending loop (refer perf config intel-pt.max-loops)",
+       [INTEL_PT_ERR_EPTW]   = "Broken emulated ptwrite",
 };
 
 int intel_pt__strerror(int code, char *buf, size_t buflen)
@@ -1535,17 +1539,108 @@ static int intel_pt_walk_tip(struct intel_pt_decoder *decoder)
        return intel_pt_bug(decoder);
 }
 
+struct eptw_data {
+       int bit_countdown;
+       uint64_t payload;
+};
+
+static int intel_pt_eptw_lookahead_cb(struct intel_pt_pkt_info *pkt_info)
+{
+       struct eptw_data *data = pkt_info->data;
+       int nr_bits;
+
+       switch (pkt_info->packet.type) {
+       case INTEL_PT_PAD:
+       case INTEL_PT_MNT:
+       case INTEL_PT_MODE_EXEC:
+       case INTEL_PT_MODE_TSX:
+       case INTEL_PT_MTC:
+       case INTEL_PT_FUP:
+       case INTEL_PT_CYC:
+       case INTEL_PT_CBR:
+       case INTEL_PT_TSC:
+       case INTEL_PT_TMA:
+       case INTEL_PT_PIP:
+       case INTEL_PT_VMCS:
+       case INTEL_PT_PSB:
+       case INTEL_PT_PSBEND:
+       case INTEL_PT_PTWRITE:
+       case INTEL_PT_PTWRITE_IP:
+       case INTEL_PT_EXSTOP:
+       case INTEL_PT_EXSTOP_IP:
+       case INTEL_PT_MWAIT:
+       case INTEL_PT_PWRE:
+       case INTEL_PT_PWRX:
+       case INTEL_PT_BBP:
+       case INTEL_PT_BIP:
+       case INTEL_PT_BEP:
+       case INTEL_PT_BEP_IP:
+       case INTEL_PT_CFE:
+       case INTEL_PT_CFE_IP:
+       case INTEL_PT_EVD:
+               break;
+
+       case INTEL_PT_TNT:
+               nr_bits = data->bit_countdown;
+               if (nr_bits > pkt_info->packet.count)
+                       nr_bits = pkt_info->packet.count;
+               data->payload <<= nr_bits;
+               data->payload |= pkt_info->packet.payload >> (64 - nr_bits);
+               data->bit_countdown -= nr_bits;
+               return !data->bit_countdown;
+
+       case INTEL_PT_TIP_PGE:
+       case INTEL_PT_TIP_PGD:
+       case INTEL_PT_TIP:
+       case INTEL_PT_BAD:
+       case INTEL_PT_OVF:
+       case INTEL_PT_TRACESTOP:
+       default:
+               return 1;
+       }
+
+       return 0;
+}
+
+static int intel_pt_emulated_ptwrite(struct intel_pt_decoder *decoder)
+{
+       int n = 64 - decoder->tnt.count;
+       struct eptw_data data = {
+               .bit_countdown = n,
+               .payload = decoder->tnt.payload >> n,
+       };
+
+       decoder->emulated_ptwrite = false;
+       intel_pt_log("Emulated ptwrite detected\n");
+
+       intel_pt_pkt_lookahead(decoder, intel_pt_eptw_lookahead_cb, &data);
+       if (data.bit_countdown)
+               return -ECONNRESET;
+
+       decoder->state.type = INTEL_PT_PTW;
+       decoder->state.from_ip = decoder->ip;
+       decoder->state.to_ip = 0;
+       decoder->state.ptw_payload = data.payload;
+       return 0;
+}
+
 static int intel_pt_walk_tnt(struct intel_pt_decoder *decoder)
 {
        struct intel_pt_insn intel_pt_insn;
        int err;
 
        while (1) {
+               if (decoder->emulated_ptwrite)
+                       return intel_pt_emulated_ptwrite(decoder);
                err = intel_pt_walk_insn(decoder, &intel_pt_insn, 0);
-               if (err == INTEL_PT_RETURN)
+               if (err == INTEL_PT_RETURN) {
+                       decoder->emulated_ptwrite = intel_pt_insn.emulated_ptwrite;
                        return 0;
-               if (err)
+               }
+               if (err) {
+                       decoder->emulated_ptwrite = false;
                        return err;
+               }
 
                if (intel_pt_insn.op == INTEL_PT_OP_RET) {
                        if (!decoder->return_compression) {
index efb2cb3..c773028 100644 (file)
@@ -58,6 +58,7 @@ enum {
        INTEL_PT_ERR_LOST,
        INTEL_PT_ERR_UNK,
        INTEL_PT_ERR_NELOOP,
+       INTEL_PT_ERR_EPTW,
        INTEL_PT_ERR_MAX,
 };
 
index 9d5e65c..1376077 100644 (file)
@@ -32,6 +32,7 @@ static void intel_pt_insn_decoder(struct insn *insn,
        int ext;
 
        intel_pt_insn->rel = 0;
+       intel_pt_insn->emulated_ptwrite = false;
 
        if (insn_is_avx(insn)) {
                intel_pt_insn->op = INTEL_PT_OP_OTHER;
index c2861cf..e3338b5 100644 (file)
@@ -37,6 +37,7 @@ enum intel_pt_insn_branch {
 struct intel_pt_insn {
        enum intel_pt_insn_op           op;
        enum intel_pt_insn_branch       branch;
+       bool                            emulated_ptwrite;
        int                             length;
        int32_t                         rel;
        unsigned char                   buf[INTEL_PT_INSN_BUF_SZ];
index ec43d36..c7e115f 100644 (file)
@@ -530,6 +530,7 @@ struct intel_pt_cache_entry {
        u64                             byte_cnt;
        enum intel_pt_insn_op           op;
        enum intel_pt_insn_branch       branch;
+       bool                            emulated_ptwrite;
        int                             length;
        int32_t                         rel;
        char                            insn[INTEL_PT_INSN_BUF_SZ];
@@ -616,6 +617,7 @@ static int intel_pt_cache_add(struct dso *dso, struct machine *machine,
        e->byte_cnt = byte_cnt;
        e->op = intel_pt_insn->op;
        e->branch = intel_pt_insn->branch;
+       e->emulated_ptwrite = intel_pt_insn->emulated_ptwrite;
        e->length = intel_pt_insn->length;
        e->rel = intel_pt_insn->rel;
        memcpy(e->insn, intel_pt_insn->buf, INTEL_PT_INSN_BUF_SZ);
@@ -702,6 +704,28 @@ static int intel_pt_get_guest(struct intel_pt_queue *ptq)
        return 0;
 }
 
+static inline bool intel_pt_jmp_16(struct intel_pt_insn *intel_pt_insn)
+{
+       return intel_pt_insn->rel == 16 && intel_pt_insn->branch == INTEL_PT_BR_UNCONDITIONAL;
+}
+
+#define PTWRITE_MAGIC          "\x0f\x0bperf,ptwrite  "
+#define PTWRITE_MAGIC_LEN      16
+
+static bool intel_pt_emulated_ptwrite(struct dso *dso, struct machine *machine, u64 offset)
+{
+       unsigned char buf[PTWRITE_MAGIC_LEN];
+       ssize_t len;
+
+       len = dso__data_read_offset(dso, machine, offset, buf, PTWRITE_MAGIC_LEN);
+       if (len == PTWRITE_MAGIC_LEN && !memcmp(buf, PTWRITE_MAGIC, PTWRITE_MAGIC_LEN)) {
+               intel_pt_log("Emulated ptwrite signature found\n");
+               return true;
+       }
+       intel_pt_log("Emulated ptwrite signature not found\n");
+       return false;
+}
+
 static int intel_pt_walk_next_insn(struct intel_pt_insn *intel_pt_insn,
                                   uint64_t *insn_cnt_ptr, uint64_t *ip,
                                   uint64_t to_ip, uint64_t max_insn_cnt,
@@ -764,6 +788,7 @@ static int intel_pt_walk_next_insn(struct intel_pt_insn *intel_pt_insn,
                                *ip += e->byte_cnt;
                                intel_pt_insn->op = e->op;
                                intel_pt_insn->branch = e->branch;
+                               intel_pt_insn->emulated_ptwrite = e->emulated_ptwrite;
                                intel_pt_insn->length = e->length;
                                intel_pt_insn->rel = e->rel;
                                memcpy(intel_pt_insn->buf, e->insn,
@@ -795,8 +820,18 @@ static int intel_pt_walk_next_insn(struct intel_pt_insn *intel_pt_insn,
 
                        insn_cnt += 1;
 
-                       if (intel_pt_insn->branch != INTEL_PT_BR_NO_BRANCH)
+                       if (intel_pt_insn->branch != INTEL_PT_BR_NO_BRANCH) {
+                               bool eptw;
+                               u64 offs;
+
+                               if (!intel_pt_jmp_16(intel_pt_insn))
+                                       goto out;
+                               /* Check for emulated ptwrite */
+                               offs = offset + intel_pt_insn->length;
+                               eptw = intel_pt_emulated_ptwrite(al.map->dso, machine, offs);
+                               intel_pt_insn->emulated_ptwrite = eptw;
                                goto out;
+                       }
 
                        if (max_insn_cnt && insn_cnt >= max_insn_cnt)
                                goto out_no_cache;