1 /*******************************************************************************
2 * Copyright (C) 2018 Cadence Design Systems, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining
5 * a copy of this software and associated documentation files (the
6 * "Software"), to use this Software with Cadence processor cores only and
7 * not with any other processors and platforms, subject to
8 * the following conditions:
9 *
10 * The above copyright notice and this permission notice shall be included
11 * in all copies or substantial portions of the Software.
12 *
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
14 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
15 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
16 * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
17 * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
18 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
19 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
20 
21 ******************************************************************************/
22 
23 #ifndef __XA_PROFILER_H__
24 #define __XA_PROFILER_H__
25 
26 #if !defined(PROFILE) && __XCC__
27 #define PROFILE 1
28 #endif
29 
30 #if !defined(PREFETCH_CTL) && __XCC__
31 #define PREFETCH_CTL 1
32 #endif
33 
34 #ifdef PROFILE
35 #include <xtensa/hal.h>
36 #include <sys/times.h>
37 
38 #include "xa_type_def.h"
39 #include "xa_timer.h"
40 
41 TRACE_TAG(MCPS,1);
42 
43 typedef struct XA_PROFILER {
44 #if 1
45     unsigned long cstart;
46     unsigned long cstop;
47     unsigned long cycles;
48     unsigned long g_output_bytes;
49     unsigned long Peak;
50     unsigned long Sum;
51 
52     unsigned long sample_rate;
53     unsigned long channels;
54     unsigned long pcm_width;
55 #else
56     struct tms start;
57     struct tms stop;
58     double Peak;
59     double Sum;
60     long long cycles;
61 #endif
62     int Peak_frame;
63     int frame_count;
64     long long output_bytes;
65     long long total_cycles;
66     long long total_samples;
67     char *id;
68 } xa_profiler;
69 
70 extern xa_profiler prof;
71 
72 static inline void xa_compute_mcps(xa_profiler *p_prof, WORD32 samples_decoded, UWORD32 samp_freq, long long gen_strm_pos)
73 {
74     double Ave=0.0, Curr;
75 
76     if (samples_decoded <= 0)
77         return;
78 
79     p_prof->total_samples += samples_decoded;
80     p_prof->frame_count++;
81 
82     clock_t cycles = p_prof->cycles;
83     p_prof->total_cycles = 0;
84     Curr = ((double) cycles / samples_decoded * samp_freq / 1000000);
85 
86     if (p_prof->frame_count > 1) {
87         p_prof->Sum += Curr;
88         Ave = p_prof->Sum / (p_prof->frame_count-1);
89 
90         if (p_prof->Peak < Curr) {
91             p_prof->Peak = Curr;
92             p_prof->Peak_frame = (p_prof->frame_count);
93         }
94     }
95 
96     unsigned long long total_msec =
97         (unsigned long long)((double)p_prof->total_samples / samp_freq * 1000.0);
98     int msec = (int)(total_msec % 1000);
99     unsigned long long total_seconds = total_msec / 1000;
100     int seconds = (int)(total_seconds % 60);
101     int minutes = (int)(total_seconds / 60);
102 
103 #if 1
104     TRACE(MCPS, _b("[%d] %d:%d.%d MCPS: %d Average: %d samples: %d\n"),
105         p_prof->frame_count, (uint32_t)minutes, (uint32_t)seconds, (uint32_t)msec,
106         (uint32_t)Curr, (uint32_t)Ave, samples_decoded);
107 #else
108     TRACE(MCPS, _b("[%d|%lld] %d:%02d.%03d MCPS: %.2f Average: %.2f Peak: %.2f @ [%d] %s\n"),
109         p_prof->frame_count, gen_strm_pos, minutes, seconds, msec,
110         Curr, Ave, p_prof->Peak, p_prof->Peak_frame, p_prof->id);
111 #endif
112 
113     /* reset counters */
114     p_prof->g_output_bytes = 0;
115     p_prof->cycles = 0;
116 }
117 
118 #define INIT_XA_PROFILER(x, a)                  do { memset(&x, 0, sizeof(xa_profiler)); \
119                                                      x.sample_rate = 48000;\
120                                                      x.channels = 2;\
121                                                      x.pcm_width = 16;\
122                                                      x.id = a; } while(0)
123 
124 #define START_TIME_XA_PROFILER(x)               do { set_ccount(0); \
125                                                      x.cstart=read_ccount(); } while(0)
126 #define STOP_TIME_XA_PROFILER(x)                do { x.cstop =read_ccount(); \
127                                                      x.cycles += (x.cstop - x.cstart); } while(0)
128 #define COMPUTE_MHZ_XA_PROFILER(x, a, b, c)        do { xa_compute_mcps(&x, a, b, c); } while(0)
129 #define SUMMARY_XA_PROFILER(x)                  do { fprintf(stdout,"\n%5s Peak MCPS = %f\n", x.id, x.Peak); \
130                                                      fprintf(stdout,"%5s Peak frame = %d\n", x.id, x.Peak_frame); \
131                                                      fprintf(stdout,"%5s Average MCPS = %f\n", x.id, (x.frame_count < 2) ? 0 : (x.Sum/(x.frame_count-1))); } while(0)
132 
133 #else
134 
135 typedef struct XA_PROFILER {
136     int place_holder;
137 } xa_profiler;
138 
139 #define INIT_XA_PROFILER(x, a)                  do {} while(0)
140 #define START_TIME_XA_PROFILER(x)               do {} while(0)
141 #define STOP_TIME_XA_PROFILER(x)                do {} while(0)
142 #define COMPUTE_MHZ_XA_PROFILER(x, a, b)        do {} while(0)
143 #define SUMMARY_XA_PROFILER(x)                  do {} while(0)
144 #endif
145 
146 #ifdef PREFETCH_CTL
147 #define PREFETCH_AGGRESSIVE(x)                  do { x = xthal_set_cache_prefetch ((XTHAL_DCACHE_PREFETCH_HIGH | XTHAL_ICACHE_PREFETCH_HIGH)); \
148                                                    } while(0)
149 #define PREFETCH_RESTORE(x)                     do { xthal_set_cache_prefetch (x); } while(0)
150 #else
151 #define PREFETCH_AGGRESSIVE(x)                  do {} while(0)
152 #define PREFETCH_RESTORE(x)                     do {} while(0)
153 #endif
154 
155 #endif /* __XA_PROFILER_H__ */
156 
157