summaryrefslogtreecommitdiff
path: root/libavcodec/ppc/dsputil_ppc.h
blob: 8c325fbc75fdf62cafb13df23dc0885a886c6fe4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
/*
 * Copyright (c) 2003 Romain Dolbeau <romain@dolbeau.org>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */

#ifndef _DSPUTIL_PPC_
#define _DSPUTIL_PPC_

/*
 * NO_DCBZL is defined whenever the assembler cannot be assumed to accept
 * the DCBZL mnemonic:
 *  - on Darwin, the Apple assembler shipped with gcc-3.3 knows about it,
 *    earlier assemblers do not (we assume the Darwin GCC is Apple's);
 *  - no non-Apple assembler is believed to know about DCBZL.
 */
#if !defined(CONFIG_DARWIN) || (__GNUC__ * 100 + __GNUC_MINOR__ < 303)
#define NO_DCBZL
#endif

#ifdef POWERPC_TBL_PERFORMANCE_REPORT
/* Only declared when POWERPC_TBL_PERFORMANCE_REPORT is defined.
   Takes no arguments and returns nothing; the definition is not in this
   header. NOTE(review): judging by the name it prints the statistics
   gathered in the perfdata tables -- confirm against the definition. */
void powerpc_display_perf_report(void);
/*
 * Row index into the perfdata tables, one entry per profiled routine.
 * powerpc_perf_total has to remain the last enumerator: it is the number
 * of rows and is used as the first dimension of the perfdata arrays.
 *
 * If you add to this enum, also add to the perfname array
 * in dsputil_ppc.c.
 */
enum powerpc_perf_index {
    /* entries named altivec_* */
    altivec_fft_num = 0,
    altivec_gmc1_num,
    altivec_dct_unquantize_h263_num,
    altivec_idct_add_num,
    altivec_idct_put_num,
    altivec_put_pixels16_num,
    altivec_avg_pixels16_num,
    altivec_avg_pixels8_num,
    altivec_put_pixels8_xy2_num,
    altivec_put_no_rnd_pixels8_xy2_num,
    altivec_put_pixels16_xy2_num,
    altivec_put_no_rnd_pixels16_xy2_num,

    /* entries named powerpc_clear_blocks_* */
    powerpc_clear_blocks_dcbz32,
    powerpc_clear_blocks_dcbz128,

    /* number of entries above; keep last */
    powerpc_perf_total
};
/*
 * Column index into one row of the perfdata tables. The stop-count macros
 * maintain these four values for every profiled routine.
 */
enum powerpc_data_index {
    powerpc_data_min = 0,   /* smallest difference recorded so far */
    powerpc_data_max,       /* largest difference recorded so far */
    powerpc_data_sum,       /* running sum of the recorded differences */
    powerpc_data_num,       /* how many differences were recorded */
    powerpc_data_total      /* number of columns; keep last */
};
/* Statistics table indexed [powerpc_perf_index][powerpc_data_index];
   updated by POWERPC_TBL_STOP_COUNT. Declared here only, the storage is
   defined outside this header. */
extern unsigned long long perfdata[powerpc_perf_total][powerpc_data_total];
#ifdef POWERPC_PERF_USE_PMC
/* Tables with the same layout for the PMC2 and PMC3 readings; they only
   exist when POWERPC_PERF_USE_PMC is defined. */
extern unsigned long long perfdata_pmc2[powerpc_perf_total][powerpc_data_total];
extern unsigned long long perfdata_pmc3[powerpc_perf_total][powerpc_data_total];
#endif

#ifndef POWERPC_PERF_USE_PMC
/*
 * Profiling through the "mftb" instruction (POWERPC_PERF_USE_PMC not
 * defined).
 *
 * POWERPC_GET_CYCLES(a)             store the value read by mftb into a.
 * POWERPC_TBL_DECLARE(a, cond)      declare the tbl_start/tbl_stop locals
 *                                   used by the two macros below; both
 *                                   arguments are ignored.
 * POWERPC_TBL_START_COUNT(a, cond)  take the start reading; both arguments
 *                                   are ignored.
 * POWERPC_TBL_STOP_COUNT(a, cond)   take the stop reading and, if cond is
 *                                   true, update row a of perfdata
 *                                   (min, max, sum, sample count).
 */
#define POWERPC_GET_CYCLES(a) asm volatile("mftb %0" : "=r" (a))
#define POWERPC_TBL_DECLARE(a, cond) register unsigned long tbl_start, tbl_stop
#define POWERPC_TBL_START_COUNT(a, cond) do { POWERPC_GET_CYCLES(tbl_start); } while (0)
/* A stop reading smaller than the start reading is discarded (presumably
   the counter wrapped in between). A difference of zero is a valid sample
   and is recorded, which matches the >= test used by the
   POWERPC_PERF_USE_PMC variant of this macro. */
#define POWERPC_TBL_STOP_COUNT(a, cond) do {     \
  POWERPC_GET_CYCLES(tbl_stop);                  \
  if (tbl_stop >= tbl_start)                     \
  {                                              \
    unsigned long diff =  tbl_stop - tbl_start;  \
    if (cond)                                    \
    {                                            \
      if (diff < perfdata[a][powerpc_data_min])  \
        perfdata[a][powerpc_data_min] = diff;    \
      if (diff > perfdata[a][powerpc_data_max])  \
        perfdata[a][powerpc_data_max] = diff;    \
      perfdata[a][powerpc_data_sum] += diff;     \
      perfdata[a][powerpc_data_num] ++;          \
    }                                            \
  }                                              \
} while (0)

#else /* POWERPC_PERF_USE_PMC */
/*
 * Profiling through "mfspr" reads (POWERPC_PERF_USE_PMC defined).
 * Three values are sampled: SPR 937 (kept in the cycles_* locals and
 * accumulated in perfdata), SPR 938 (pmc2_*, perfdata_pmc2) and SPR 941
 * (pmc3_*, perfdata_pmc3).
 */
#define POWERPC_GET_CYCLES(a) asm volatile("mfspr %0, 937" : "=r" (a))
#define POWERPC_GET_PMC2(a) asm volatile("mfspr %0, 938" : "=r" (a))
#define POWERPC_GET_PMC3(a) asm volatile("mfspr %0, 941" : "=r" (a))

/* Declares the start/stop locals of all three counters; both arguments
   are ignored. */
#define POWERPC_TBL_DECLARE(a, cond)                 \
  register unsigned long cycles_start, cycles_stop,  \
                         pmc2_start, pmc2_stop,      \
                         pmc3_start, pmc3_stop

/* Takes the start readings in the order PMC3, PMC2, cycles; both
   arguments are ignored. */
#define POWERPC_TBL_START_COUNT(a, cond) do {    \
  POWERPC_GET_PMC3(pmc3_start);                  \
  POWERPC_GET_PMC2(pmc2_start);                  \
  POWERPC_GET_CYCLES(cycles_start);              \
} while (0)

/* Helper for POWERPC_TBL_STOP_COUNT: when stop >= start and cond is true,
   folds (stop - start) into row a of table (min, max, sum, sample count).
   A pair with stop < start is skipped without evaluating cond. */
#define POWERPC_TBL_ACCUMULATE(table, a, cond, start, stop) do { \
  if ((stop) >= (start))                                         \
  {                                                              \
    unsigned long diff = (stop) - (start);                       \
    if (cond)                                                    \
    {                                                            \
      if (diff < table[a][powerpc_data_min])                     \
        table[a][powerpc_data_min] = diff;                       \
      if (diff > table[a][powerpc_data_max])                     \
        table[a][powerpc_data_max] = diff;                       \
      table[a][powerpc_data_sum] += diff;                        \
      table[a][powerpc_data_num] ++;                             \
    }                                                            \
  }                                                              \
} while (0)

/* Takes the stop readings in the order cycles, PMC2, PMC3, then updates
   perfdata, perfdata_pmc2 and perfdata_pmc3 in that order. */
#define POWERPC_TBL_STOP_COUNT(a, cond) do {                                 \
  POWERPC_GET_CYCLES(cycles_stop);                                           \
  POWERPC_GET_PMC2(pmc2_stop);                                               \
  POWERPC_GET_PMC3(pmc3_stop);                                               \
  POWERPC_TBL_ACCUMULATE(perfdata, a, cond, cycles_start, cycles_stop);      \
  POWERPC_TBL_ACCUMULATE(perfdata_pmc2, a, cond, pmc2_start, pmc2_stop);     \
  POWERPC_TBL_ACCUMULATE(perfdata_pmc3, a, cond, pmc3_start, pmc3_stop);     \
} while (0)

#endif /* POWERPC_PERF_USE_PMC */


#else /* POWERPC_TBL_PERFORMANCE_REPORT */
/*
 * Profiling disabled: the macros expand to harmless placeholders so that
 * their uses do not turn into empty statements.
 *  - DECLARE yields an unused dummy variable,
 *  - START/STOP yield a statement that does nothing.
 */
#define POWERPC_TBL_DECLARE(a, cond) \
  int altivec_placeholder __attribute__ ((unused))
#define POWERPC_TBL_START_COUNT(a, cond) ((void)0)
#define POWERPC_TBL_STOP_COUNT(a, cond)  ((void)0)
#endif /* POWERPC_TBL_PERFORMANCE_REPORT */

#endif /*  _DSPUTIL_PPC_ */