Em Wed, Jun 05, 2019 at 10:16:33AM -0600, Mathieu Poirier escreveu:
> This patch adds the necessay intelligence to properly compute the value
> of 'old' and 'head' when operating in snapshot mode.  That way we can get
> the latest information in the AUX buffer and be compatible with the
> generic AUX ring buffer mechanic.

Leo, have you had the chance to test/review this one? Suzuki?

I also changed the subject to:

  [PATCH] perf cs-etm: Properly set the value of 'old' and 'head' in snapshot 
mode

So that when looking at a 'git log --oneline' one can have the proper
context and know that its about cs-etm.

- Arnaldo
 
> Signed-off-by: Mathieu Poirier <mathieu.poir...@linaro.org>
> ---
>  tools/perf/arch/arm/util/cs-etm.c | 127 +++++++++++++++++++++++++++++-
>  1 file changed, 123 insertions(+), 4 deletions(-)
> 
> diff --git a/tools/perf/arch/arm/util/cs-etm.c 
> b/tools/perf/arch/arm/util/cs-etm.c
> index 911426721170..0a278bbcaba6 100644
> --- a/tools/perf/arch/arm/util/cs-etm.c
> +++ b/tools/perf/arch/arm/util/cs-etm.c
> @@ -31,6 +31,8 @@ struct cs_etm_recording {
>       struct auxtrace_record  itr;
>       struct perf_pmu         *cs_etm_pmu;
>       struct perf_evlist      *evlist;
> +     int                     wrapped_cnt;
> +     bool                    *wrapped;
>       bool                    snapshot_mode;
>       size_t                  snapshot_size;
>  };
> @@ -536,16 +538,131 @@ static int cs_etm_info_fill(struct auxtrace_record 
> *itr,
>       return 0;
>  }
>  
> -static int cs_etm_find_snapshot(struct auxtrace_record *itr __maybe_unused,
> +static int cs_etm_alloc_wrapped_array(struct cs_etm_recording *ptr, int idx)
> +{
> +     bool *wrapped;
> +     int cnt = ptr->wrapped_cnt;
> +
> +     /* Make @ptr->wrapped as big as @idx */
> +     while (cnt <= idx)
> +             cnt++;
> +
> +     /*
> +      * Free'ed in cs_etm_recording_free().  Using realloc() to avoid
> +      * cross compilation problems where the host's system supports
> +      * reallocarray() but not the target.
> +      */
> +     wrapped = realloc(ptr->wrapped, cnt * sizeof(bool));
> +     if (!wrapped)
> +             return -ENOMEM;
> +
> +     wrapped[cnt - 1] = false;
> +     ptr->wrapped_cnt = cnt;
> +     ptr->wrapped = wrapped;
> +
> +     return 0;
> +}
> +
> +static bool cs_etm_buffer_has_wrapped(unsigned char *buffer,
> +                                   size_t buffer_size, u64 head)
> +{
> +     u64 i, watermark;
> +     u64 *buf = (u64 *)buffer;
> +     size_t buf_size = buffer_size;
> +
> +     /*
> +      * We want to look the very last 512 byte (chosen arbitrarily) in
> +      * the ring buffer.
> +      */
> +     watermark = buf_size - 512;
> +
> +     /*
> +      * @head is continuously increasing - if its value is equal or greater
> +      * than the size of the ring buffer, it has wrapped around.
> +      */
> +     if (head >= buffer_size)
> +             return true;
> +
> +     /*
> +      * The value of @head is somewhere within the size of the ring buffer.
> +      * This can be that there hasn't been enough data to fill the ring
> +      * buffer yet or the trace time was so long that @head has numerically
> +      * wrapped around.  To find we need to check if we have data at the very
> +      * end of the ring buffer.  We can reliably do this because mmap'ed
> +      * pages are zeroed out and there is a fresh mapping with every new
> +      * session.
> +      */
> +
> +     /* @head is less than 512 byte from the end of the ring buffer */
> +     if (head > watermark)
> +             watermark = head;
> +
> +     /*
> +      * Speed things up by using 64 bit transactions (see "u64 *buf" above)
> +      */
> +     watermark >>= 3;
> +     buf_size >>= 3;
> +
> +     /*
> +      * If we find trace data at the end of the ring buffer, @head has
> +      * been there and has numerically wrapped around at least once.
> +      */
> +     for (i = watermark; i < buf_size; i++)
> +             if (buf[i])
> +                     return true;
> +
> +     return false;
> +}
> +
> +static int cs_etm_find_snapshot(struct auxtrace_record *itr,
>                               int idx, struct auxtrace_mmap *mm,
> -                             unsigned char *data __maybe_unused,
> +                             unsigned char *data,
>                               u64 *head, u64 *old)
>  {
> +     int err;
> +     bool wrapped;
> +     struct cs_etm_recording *ptr =
> +                     container_of(itr, struct cs_etm_recording, itr);
> +
> +     /*
> +      * Allocate memory to keep track of wrapping if this is the first
> +      * time we deal with this *mm.
> +      */
> +     if (idx >= ptr->wrapped_cnt) {
> +             err = cs_etm_alloc_wrapped_array(ptr, idx);
> +             if (err)
> +                     return err;
> +     }
> +
> +     /*
> +      * Check to see if *head has wrapped around.  If it hasn't only the
> +      * amount of data between *head and *old is snapshot'ed to avoid
> +      * bloating the perf.data file with zeros.  But as soon as *head has
> +      * wrapped around the entire size of the AUX ring buffer it taken.
> +      */
> +     wrapped = ptr->wrapped[idx];
> +     if (!wrapped && cs_etm_buffer_has_wrapped(data, mm->len, *head)) {
> +             wrapped = true;
> +             ptr->wrapped[idx] = true;
> +     }
> +
>       pr_debug3("%s: mmap index %d old head %zu new head %zu size %zu\n",
>                 __func__, idx, (size_t)*old, (size_t)*head, mm->len);
>  
> -     *old = *head;
> -     *head += mm->len;
> +     /* No wrap has occurred, we can just use *head and *old. */
> +     if (!wrapped)
> +             return 0;
> +
> +     /*
> +      * *head has wrapped around - adjust *head and *old to pickup the
> +      * entire content of the AUX buffer.
> +      */
> +     if (*head >= mm->len) {
> +             *old = *head - mm->len;
> +     } else {
> +             *head += mm->len;
> +             *old = *head - mm->len;
> +     }
>  
>       return 0;
>  }
> @@ -586,6 +703,8 @@ static void cs_etm_recording_free(struct auxtrace_record 
> *itr)
>  {
>       struct cs_etm_recording *ptr =
>                       container_of(itr, struct cs_etm_recording, itr);
> +
> +     zfree(&ptr->wrapped);
>       free(ptr);
>  }
>  
> -- 
> 2.17.1

-- 

- Arnaldo

Reply via email to