Current PERF_SAMPLE_WEIGHT sample type is very useful to expresses the
cost of an action represented by the sample. This allows the profiler
to scale the samples to be more informative to the programmer. It could
also help to locate a hotspot, e.g., when profiling by memory latencies,
the expensive load appear higher up in the histograms. But current
PERF_SAMPLE_WEIGHT sample type is solely determined by one factor. This
could be a problem, if users want two or more factors to contribute to
the weight. For example, Golden Cove core PMU can provide both the
instruction latency and the cache Latency information as factors for the
memory profiling.
For current X86 platforms, although meminfo::latency is defined as a
u64, only the lower 32 bits include the valid data in practice (No
memory access could last than 4G cycles). The higher 32 bits can be used
to store new factors.
Add a new sample type, PERF_SAMPLE_WEIGHT_STRUCT, to indicate the new
sample weight structure. It shares the same space as the
PERF_SAMPLE_WEIGHT sample type.
Users can apply either the PERF_SAMPLE_WEIGHT sample type or the
PERF_SAMPLE_WEIGHT_STRUCT sample type to retrieve the sample weight, but
they cannot apply both sample types simultaneously.
Currently, only X86 and PowerPC use the PERF_SAMPLE_WEIGHT sample type.
- For PowerPC, there is nothing changed for the PERF_SAMPLE_WEIGHT
  sample type. There is no effect for the new PERF_SAMPLE_WEIGHT_STRUCT
  sample type. PowerPC can re-struct the weight field similarly later.
- For X86, the same value will be dumped for the PERF_SAMPLE_WEIGHT
  sample type or the PERF_SAMPLE_WEIGHT_STRUCT sample type for now.
  The following patches will apply the new factors for the
  PERF_SAMPLE_WEIGHT_STRUCT sample type.
The field in the union perf_sample_weight should be shared among
different architectures. A generic name is required, but it's hard to
abstract a name that applies to all architectures. For example, on X86,
the fields are to store all kinds of latency. While on PowerPC, it
stores MMCRA[TECX/TECM], which should not be latency. So a general name
prefix 'var$NUM' is used here.
Suggested-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Kan Liang <kan.liang@linux.intel.com>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Link: https://lkml.kernel.org/r/1611873611-156687-2-git-send-email-kan.liang@linux.intel.com
 
                if (event->attr.sample_type & PERF_SAMPLE_WEIGHT &&
                                                ppmu->get_mem_weight)
-                       ppmu->get_mem_weight(&data.weight);
+                       ppmu->get_mem_weight(&data.weight.full);
 
                if (perf_event_overflow(event, &data, regs))
                        power_pmu_stop(event, 0);
 
 }
 
 #define PERF_PEBS_MEMINFO_TYPE (PERF_SAMPLE_ADDR | PERF_SAMPLE_DATA_SRC |   \
-                               PERF_SAMPLE_PHYS_ADDR | PERF_SAMPLE_WEIGHT | \
+                               PERF_SAMPLE_PHYS_ADDR |                      \
+                               PERF_SAMPLE_WEIGHT_TYPE |                    \
                                PERF_SAMPLE_TRANSACTION |                    \
                                PERF_SAMPLE_DATA_PAGE_SIZE)
 
        gprs = (sample_type & PERF_SAMPLE_REGS_INTR) &&
               (attr->sample_regs_intr & PEBS_GP_REGS);
 
-       tsx_weight = (sample_type & PERF_SAMPLE_WEIGHT) &&
+       tsx_weight = (sample_type & PERF_SAMPLE_WEIGHT_TYPE) &&
                     ((attr->config & INTEL_ARCH_EVENT_MASK) ==
                      x86_pmu.rtm_abort_event);
 
        /*
         * Use latency for weight (only avail with PEBS-LL)
         */
-       if (fll && (sample_type & PERF_SAMPLE_WEIGHT))
-               data->weight = pebs->lat;
+       if (fll && (sample_type & PERF_SAMPLE_WEIGHT_TYPE))
+               data->weight.full = pebs->lat;
 
        /*
         * data.data_src encodes the data source
 
        if (x86_pmu.intel_cap.pebs_format >= 2) {
                /* Only set the TSX weight when no memory weight. */
-               if ((sample_type & PERF_SAMPLE_WEIGHT) && !fll)
-                       data->weight = intel_get_tsx_weight(pebs->tsx_tuning);
+               if ((sample_type & PERF_SAMPLE_WEIGHT_TYPE) && !fll)
+                       data->weight.full = intel_get_tsx_weight(pebs->tsx_tuning);
 
                if (sample_type & PERF_SAMPLE_TRANSACTION)
                        data->txn = intel_get_tsx_transaction(pebs->tsx_tuning,
        }
 
        if (format_size & PEBS_DATACFG_MEMINFO) {
-               if (sample_type & PERF_SAMPLE_WEIGHT)
-                       data->weight = meminfo->latency ?:
+               if (sample_type & PERF_SAMPLE_WEIGHT_TYPE)
+                       data->weight.full = meminfo->latency ?:
                                intel_get_tsx_weight(meminfo->tsx_tuning);
 
                if (sample_type & PERF_SAMPLE_DATA_SRC)
 
        struct perf_raw_record          *raw;
        struct perf_branch_stack        *br_stack;
        u64                             period;
-       u64                             weight;
+       union perf_sample_weight        weight;
        u64                             txn;
        union  perf_mem_data_src        data_src;
 
        data->raw  = NULL;
        data->br_stack = NULL;
        data->period = period;
-       data->weight = 0;
+       data->weight.full = 0;
        data->data_src.val = PERF_MEM_NA;
        data->txn = 0;
 }
 
        PERF_SAMPLE_CGROUP                      = 1U << 21,
        PERF_SAMPLE_DATA_PAGE_SIZE              = 1U << 22,
        PERF_SAMPLE_CODE_PAGE_SIZE              = 1U << 23,
+       PERF_SAMPLE_WEIGHT_STRUCT               = 1U << 24,
 
-       PERF_SAMPLE_MAX = 1U << 24,             /* non-ABI */
+       PERF_SAMPLE_MAX = 1U << 25,             /* non-ABI */
 
        __PERF_SAMPLE_CALLCHAIN_EARLY           = 1ULL << 63, /* non-ABI; internal use */
 };
 
+#define PERF_SAMPLE_WEIGHT_TYPE        (PERF_SAMPLE_WEIGHT | PERF_SAMPLE_WEIGHT_STRUCT)
 /*
  * values to program into branch_sample_type when PERF_SAMPLE_BRANCH is set
  *
         *        char                  data[size];
         *        u64                   dyn_size; } && PERF_SAMPLE_STACK_USER
         *
-        *      { u64                   weight;   } && PERF_SAMPLE_WEIGHT
+        *      { union perf_sample_weight
+        *       {
+        *              u64             full; && PERF_SAMPLE_WEIGHT
+        *      #if defined(__LITTLE_ENDIAN_BITFIELD)
+        *              struct {
+        *                      u32     var1_dw;
+        *                      u16     var2_w;
+        *                      u16     var3_w;
+        *              } && PERF_SAMPLE_WEIGHT_STRUCT
+        *      #elif defined(__BIG_ENDIAN_BITFIELD)
+        *              struct {
+        *                      u16     var3_w;
+        *                      u16     var2_w;
+        *                      u32     var1_dw;
+        *              } && PERF_SAMPLE_WEIGHT_STRUCT
+        *      #endif
+        *       }
+        *      }
         *      { u64                   data_src; } && PERF_SAMPLE_DATA_SRC
         *      { u64                   transaction; } && PERF_SAMPLE_TRANSACTION
         *      { u64                   abi; # enum perf_sample_regs_abi
                reserved:40;
 };
 
+union perf_sample_weight {
+       __u64           full;
+#if defined(__LITTLE_ENDIAN_BITFIELD)
+       struct {
+               __u32   var1_dw;
+               __u16   var2_w;
+               __u16   var3_w;
+       };
+#elif defined(__BIG_ENDIAN_BITFIELD)
+       struct {
+               __u16   var3_w;
+               __u16   var2_w;
+               __u32   var1_dw;
+       };
+#else
+#error "Unknown endianness"
+#endif
+};
+
 #endif /* _UAPI_LINUX_PERF_EVENT_H */
 
        if (sample_type & PERF_SAMPLE_PERIOD)
                size += sizeof(data->period);
 
-       if (sample_type & PERF_SAMPLE_WEIGHT)
-               size += sizeof(data->weight);
+       if (sample_type & PERF_SAMPLE_WEIGHT_TYPE)
+               size += sizeof(data->weight.full);
 
        if (sample_type & PERF_SAMPLE_READ)
                size += event->read_size;
                                          data->regs_user.regs);
        }
 
-       if (sample_type & PERF_SAMPLE_WEIGHT)
-               perf_output_put(handle, data->weight);
+       if (sample_type & PERF_SAMPLE_WEIGHT_TYPE)
+               perf_output_put(handle, data->weight.full);
 
        if (sample_type & PERF_SAMPLE_DATA_SRC)
                perf_output_put(handle, data->data_src.val);
        if (attr->sample_type & PERF_SAMPLE_CGROUP)
                return -EINVAL;
 #endif
+       if ((attr->sample_type & PERF_SAMPLE_WEIGHT) &&
+           (attr->sample_type & PERF_SAMPLE_WEIGHT_STRUCT))
+               return -EINVAL;
 
 out:
        return ret;