From: Madhavan Srinivasan <ma...@linux.vnet.ibm.com>

Introduce new perf sample_type PERF_SAMPLE_PIPELINE_HAZ to request kernel
to provide cpu pipeline hazard data. Also, introduce arch independent
structure 'perf_pipeline_haz_data' to pass hazard data to userspace. This
is generic structure and arch specific data needs to be converted to this
format.

Signed-off-by: Madhavan Srinivasan <ma...@linux.vnet.ibm.com>
Signed-off-by: Ravi Bangoria <ravi.bango...@linux.ibm.com>
---
 include/linux/perf_event.h            |  7 ++++++
 include/uapi/linux/perf_event.h       | 32 ++++++++++++++++++++++++++-
 kernel/events/core.c                  |  6 +++++
 tools/include/uapi/linux/perf_event.h | 32 ++++++++++++++++++++++++++-
 4 files changed, 75 insertions(+), 2 deletions(-)

diff --git a/include/linux/perf_event.h b/include/linux/perf_event.h
index 547773f5894e..d5b606e3c57d 100644
--- a/include/linux/perf_event.h
+++ b/include/linux/perf_event.h
@@ -1001,6 +1001,7 @@ struct perf_sample_data {
        u64                             stack_user_size;
 
        u64                             phys_addr;
+       struct perf_pipeline_haz_data   pipeline_haz;
 } ____cacheline_aligned;
 
 /* default value for data source */
@@ -1021,6 +1022,12 @@ static inline void perf_sample_data_init(struct 
perf_sample_data *data,
        data->weight = 0;
        data->data_src.val = PERF_MEM_NA;
        data->txn = 0;
+       data->pipeline_haz.itype = PERF_HAZ__ITYPE_NA;
+       data->pipeline_haz.icache = PERF_HAZ__ICACHE_NA;
+       data->pipeline_haz.hazard_stage = PERF_HAZ__PIPE_STAGE_NA;
+       data->pipeline_haz.hazard_reason = PERF_HAZ__HREASON_NA;
+       data->pipeline_haz.stall_stage = PERF_HAZ__PIPE_STAGE_NA;
+       data->pipeline_haz.stall_reason = PERF_HAZ__SREASON_NA;
 }
 
 extern void perf_output_sample(struct perf_output_handle *handle,
diff --git a/include/uapi/linux/perf_event.h b/include/uapi/linux/perf_event.h
index 377d794d3105..ff252618ca93 100644
--- a/include/uapi/linux/perf_event.h
+++ b/include/uapi/linux/perf_event.h
@@ -142,8 +142,9 @@ enum perf_event_sample_format {
        PERF_SAMPLE_REGS_INTR                   = 1U << 18,
        PERF_SAMPLE_PHYS_ADDR                   = 1U << 19,
        PERF_SAMPLE_AUX                         = 1U << 20,
+       PERF_SAMPLE_PIPELINE_HAZ                = 1U << 21,
 
-       PERF_SAMPLE_MAX = 1U << 21,             /* non-ABI */
+       PERF_SAMPLE_MAX = 1U << 22,             /* non-ABI */
 
        __PERF_SAMPLE_CALLCHAIN_EARLY           = 1ULL << 63, /* non-ABI; 
internal use */
 };
@@ -870,6 +871,13 @@ enum perf_event_type {
         *      { u64                   phys_addr;} && PERF_SAMPLE_PHYS_ADDR
         *      { u64                   size;
         *        char                  data[size]; } && PERF_SAMPLE_AUX
+        *      { u8                    itype;
+        *        u8                    icache;
+        *        u8                    hazard_stage;
+        *        u8                    hazard_reason;
+        *        u8                    stall_stage;
+        *        u8                    stall_reason;
+        *        u16                   pad;} && PERF_SAMPLE_PIPELINE_HAZ
         * };
         */
        PERF_RECORD_SAMPLE                      = 9,
@@ -1185,4 +1193,26 @@ struct perf_branch_entry {
                reserved:40;
 };
 
+struct perf_pipeline_haz_data {
+       /* Instruction/Opcode type: Load, Store, Branch .... */
+       __u8    itype;
+       /* Instruction Cache source */
+       __u8    icache;
+       /* Instruction suffered hazard in pipeline stage */
+       __u8    hazard_stage;
+       /* Hazard reason */
+       __u8    hazard_reason;
+       /* Instruction suffered stall in pipeline stage */
+       __u8    stall_stage;
+       /* Stall reason */
+       __u8    stall_reason;
+       __u16   pad;
+};
+
+#define PERF_HAZ__ITYPE_NA     0x0
+#define PERF_HAZ__ICACHE_NA    0x0
+#define PERF_HAZ__PIPE_STAGE_NA        0x0
+#define PERF_HAZ__HREASON_NA   0x0
+#define PERF_HAZ__SREASON_NA   0x0
+
 #endif /* _UAPI_LINUX_PERF_EVENT_H */
diff --git a/kernel/events/core.c b/kernel/events/core.c
index e453589da97c..d00037c77ccf 100644
--- a/kernel/events/core.c
+++ b/kernel/events/core.c
@@ -1754,6 +1754,9 @@ static void __perf_event_header_size(struct perf_event 
*event, u64 sample_type)
        if (sample_type & PERF_SAMPLE_PHYS_ADDR)
                size += sizeof(data->phys_addr);
 
+       if (sample_type & PERF_SAMPLE_PIPELINE_HAZ)
+               size += sizeof(data->pipeline_haz);
+
        event->header_size = size;
 }
 
@@ -6712,6 +6715,9 @@ void perf_output_sample(struct perf_output_handle *handle,
                        perf_aux_sample_output(event, handle, data);
        }
 
+       if (sample_type & PERF_SAMPLE_PIPELINE_HAZ)
+               perf_output_put(handle, data->pipeline_haz);
+
        if (!event->attr.watermark) {
                int wakeup_events = event->attr.wakeup_events;
 
diff --git a/tools/include/uapi/linux/perf_event.h 
b/tools/include/uapi/linux/perf_event.h
index 377d794d3105..ff252618ca93 100644
--- a/tools/include/uapi/linux/perf_event.h
+++ b/tools/include/uapi/linux/perf_event.h
@@ -142,8 +142,9 @@ enum perf_event_sample_format {
        PERF_SAMPLE_REGS_INTR                   = 1U << 18,
        PERF_SAMPLE_PHYS_ADDR                   = 1U << 19,
        PERF_SAMPLE_AUX                         = 1U << 20,
+       PERF_SAMPLE_PIPELINE_HAZ                = 1U << 21,
 
-       PERF_SAMPLE_MAX = 1U << 21,             /* non-ABI */
+       PERF_SAMPLE_MAX = 1U << 22,             /* non-ABI */
 
        __PERF_SAMPLE_CALLCHAIN_EARLY           = 1ULL << 63, /* non-ABI; 
internal use */
 };
@@ -870,6 +871,13 @@ enum perf_event_type {
         *      { u64                   phys_addr;} && PERF_SAMPLE_PHYS_ADDR
         *      { u64                   size;
         *        char                  data[size]; } && PERF_SAMPLE_AUX
+        *      { u8                    itype;
+        *        u8                    icache;
+        *        u8                    hazard_stage;
+        *        u8                    hazard_reason;
+        *        u8                    stall_stage;
+        *        u8                    stall_reason;
+        *        u16                   pad;} && PERF_SAMPLE_PIPELINE_HAZ
         * };
         */
        PERF_RECORD_SAMPLE                      = 9,
@@ -1185,4 +1193,26 @@ struct perf_branch_entry {
                reserved:40;
 };
 
+struct perf_pipeline_haz_data {
+       /* Instruction/Opcode type: Load, Store, Branch .... */
+       __u8    itype;
+       /* Instruction Cache source */
+       __u8    icache;
+       /* Instruction suffered hazard in pipeline stage */
+       __u8    hazard_stage;
+       /* Hazard reason */
+       __u8    hazard_reason;
+       /* Instruction suffered stall in pipeline stage */
+       __u8    stall_stage;
+       /* Stall reason */
+       __u8    stall_reason;
+       __u16   pad;
+};
+
+#define PERF_HAZ__ITYPE_NA     0x0
+#define PERF_HAZ__ICACHE_NA    0x0
+#define PERF_HAZ__PIPE_STAGE_NA        0x0
+#define PERF_HAZ__HREASON_NA   0x0
+#define PERF_HAZ__SREASON_NA   0x0
+
 #endif /* _UAPI_LINUX_PERF_EVENT_H */
-- 
2.21.1

Reply via email to