perf cs-etm: Set sample flags for instruction range packet
author Leo Yan <leo.yan@linaro.org>
Tue, 29 Jan 2019 12:28:36 +0000 (20:28 +0800)
committer Arnaldo Carvalho de Melo <acme@redhat.com>
Wed, 6 Feb 2019 13:00:40 +0000 (10:00 -0300)
The perf sample data contains flags that indicate which type of branch
instruction the hardware trace data belongs to, so they can be used to
print out a human-readable string.  Arm CoreSight ETM sample data does
not set these flags and they are always zero, which results in the perf
tool skipping the printing of the string for instruction types.

This patch sets the branch instruction flags for instruction range
packets.

Signed-off-by: Leo Yan <leo.yan@linaro.org>
Reviewed-by: Mathieu Poirier <mathieu.poirier@linaro.org>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Mike Leach <mike.leach@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Robert Walker <robert.walker@arm.com>
Cc: Suzuki K Poulouse <suzuki.poulose@arm.com>
Cc: coresight ml <coresight@lists.linaro.org>
Cc: linux-arm-kernel@lists.infradead.org
Link: http://lkml.kernel.org/r/20190129122842.32041-3-leo.yan@linaro.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
tools/perf/util/cs-etm-decoder/cs-etm-decoder.c
tools/perf/util/cs-etm-decoder/cs-etm-decoder.h
tools/perf/util/cs-etm.c

index 8a19310500d9fd4393f6acf07ec096bc5b83b7f7..e98ee49a1527b49237721c5f99e4c8610c7022bf 100644 (file)
@@ -293,6 +293,7 @@ static void cs_etm_decoder__clear_buffer(struct cs_etm_decoder *decoder)
                decoder->packet_buffer[i].last_instr_type = 0;
                decoder->packet_buffer[i].last_instr_subtype = 0;
                decoder->packet_buffer[i].last_instr_cond = 0;
+               decoder->packet_buffer[i].flags = 0;
                decoder->packet_buffer[i].cpu = INT_MIN;
        }
 }
@@ -329,6 +330,7 @@ cs_etm_decoder__buffer_packet(struct cs_etm_decoder *decoder,
        decoder->packet_buffer[et].last_instr_type = 0;
        decoder->packet_buffer[et].last_instr_subtype = 0;
        decoder->packet_buffer[et].last_instr_cond = 0;
+       decoder->packet_buffer[et].flags = 0;
 
        if (decoder->packet_count == MAX_BUFFER - 1)
                return OCSD_RESP_WAIT;
index 7cdd6a9c68a7b6ccab3d39c5d09d9298b83f3ee4..23600e57a2159d359f91695cdc604ad43df64cef 100644 (file)
@@ -45,6 +45,7 @@ struct cs_etm_packet {
        u32 instr_count;
        u32 last_instr_type;
        u32 last_instr_subtype;
+       u32 flags;
        u8 last_instr_cond;
        u8 last_instr_taken_branch;
        u8 last_instr_size;
index 27a374ddf6615eb6018a9b4135ca07a50d689cd0..d05cac5295f1a15792fc45b4575b463ed31747c1 100644 (file)
@@ -12,6 +12,7 @@
 #include <linux/log2.h>
 #include <linux/types.h>
 
+#include <opencsd/ocsd_if_types.h>
 #include <stdlib.h>
 
 #include "auxtrace.h"
@@ -719,7 +720,7 @@ static int cs_etm__synth_instruction_sample(struct cs_etm_queue *etmq,
        sample.stream_id = etmq->etm->instructions_id;
        sample.period = period;
        sample.cpu = etmq->packet->cpu;
-       sample.flags = 0;
+       sample.flags = etmq->prev_packet->flags;
        sample.insn_len = 1;
        sample.cpumode = event->sample.header.misc;
 
@@ -778,7 +779,7 @@ static int cs_etm__synth_branch_sample(struct cs_etm_queue *etmq)
        sample.stream_id = etmq->etm->branches_id;
        sample.period = 1;
        sample.cpu = etmq->packet->cpu;
-       sample.flags = 0;
+       sample.flags = etmq->prev_packet->flags;
        sample.cpumode = event->sample.header.misc;
 
        /*
@@ -1107,6 +1108,80 @@ static int cs_etm__end_block(struct cs_etm_queue *etmq)
        return 0;
 }
 
+static int cs_etm__set_sample_flags(struct cs_etm_queue *etmq)
+{
+       struct cs_etm_packet *packet = etmq->packet;
+
+       switch (packet->sample_type) {
+       case CS_ETM_RANGE:
+               /*
+                * Immediate branch instruction with neither link nor
+                * return flag: it's a normal branch instruction within
+                * the function.
+                */
+               if (packet->last_instr_type == OCSD_INSTR_BR &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_NONE) {
+                       packet->flags = PERF_IP_FLAG_BRANCH;
+
+                       if (packet->last_instr_cond)
+                               packet->flags |= PERF_IP_FLAG_CONDITIONAL;
+               }
+
+               /*
+                * Immediate branch instruction with link (e.g. BL): this is
+                * a branch instruction for a function call.
+                */
+               if (packet->last_instr_type == OCSD_INSTR_BR &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_BR_LINK)
+                       packet->flags = PERF_IP_FLAG_BRANCH |
+                                       PERF_IP_FLAG_CALL;
+
+               /*
+                * Indirect branch instruction with link (e.g. BLR): this is
+                * a branch instruction for a function call.
+                */
+               if (packet->last_instr_type == OCSD_INSTR_BR_INDIRECT &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_BR_LINK)
+                       packet->flags = PERF_IP_FLAG_BRANCH |
+                                       PERF_IP_FLAG_CALL;
+
+               /*
+                * Indirect branch instruction with subtype of
+                * OCSD_S_INSTR_V7_IMPLIED_RET: this is an explicit hint for
+                * a function return for A32/T32.
+                */
+               if (packet->last_instr_type == OCSD_INSTR_BR_INDIRECT &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_V7_IMPLIED_RET)
+                       packet->flags = PERF_IP_FLAG_BRANCH |
+                                       PERF_IP_FLAG_RETURN;
+
+               /*
+                * Indirect branch instruction without link (e.g. BR): usually
+                * this is used for function return, especially for functions
+                * within a dynamic link library.
+                */
+               if (packet->last_instr_type == OCSD_INSTR_BR_INDIRECT &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_NONE)
+                       packet->flags = PERF_IP_FLAG_BRANCH |
+                                       PERF_IP_FLAG_RETURN;
+
+               /* Return instruction for function return. */
+               if (packet->last_instr_type == OCSD_INSTR_BR_INDIRECT &&
+                   packet->last_instr_subtype == OCSD_S_INSTR_V8_RET)
+                       packet->flags = PERF_IP_FLAG_BRANCH |
+                                       PERF_IP_FLAG_RETURN;
+               break;
+       case CS_ETM_DISCONTINUITY:
+       case CS_ETM_EXCEPTION:
+       case CS_ETM_EXCEPTION_RET:
+       case CS_ETM_EMPTY:
+       default:
+               break;
+       }
+
+       return 0;
+}
+
 static int cs_etm__run_decoder(struct cs_etm_queue *etmq)
 {
        struct cs_etm_auxtrace *etm = etmq->etm;
@@ -1158,6 +1233,17 @@ static int cs_etm__run_decoder(struct cs_etm_queue *etmq)
                                         */
                                        break;
 
+                               /*
+                                * Since packet addresses are swapped in packet
+                                * handling within below switch() statements,
+                                * thus setting sample flags must be called
+                                * prior to switch() statement to use address
+                                * information before packets swapping.
+                                */
+                               err = cs_etm__set_sample_flags(etmq);
+                               if (err < 0)
+                                       break;
+
                                switch (etmq->packet->sample_type) {
                                case CS_ETM_RANGE:
                                        /*