summaryrefslogtreecommitdiff
path: root/tests/dsptest.c
blob: 57596dd1f04544d1fa6f37c282622eb18e7b622c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
/*
 * MMX optimized DSP utils
 * Copyright (c) 2000, 2001 Gerard Lantau.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 *
 */

#include <stdio.h>
#include <stdlib.h>

#define TESTCPU_MAIN
#include "dsputil.h"
#include "../libavcodec/i386/cputest.c"
#include "../libavcodec/i386/dsputil_mmx.c"
#undef TESTCPU_MAIN

#define PAD 0x10000
/*
 * for testing speed of various routine - should be probably extended
 * for a general purpose regression test later
 *
 * currently only for i386 - FIXME
 */
static const struct pix_func {
    char* name;
    op_pixels_func func;
    int mm_flags;
} pix_func[] = {
    { "put_pixels_x2_mmx", put_pixels_y2_mmx, MM_MMX },
    { "put_pixels_x2_3dnow", put_pixels_y2_3dnow, MM_3DNOW },
    { "put_pixels_x2_mmx2", put_pixels_y2_mmx2, MM_MMXEXT | PAD },

    { "put_no_rnd_pixels_x2_mmx", put_no_rnd_pixels_x2_mmx, MM_MMX },
    { "put_no_rnd_pixels_x2_3dnow", put_no_rnd_pixels_x2_3dnow, MM_3DNOW },
    { "put_no_rnd_pixels_x2_mmx2", put_no_rnd_pixels_x2_mmx2, MM_MMXEXT | PAD },

    { "put_pixels_y2_mmx", put_pixels_y2_mmx, MM_MMX },
    { "put_pixels_y2_3dnow", put_pixels_y2_3dnow, MM_3DNOW },
    { "put_pixels_y2_mmx2", put_pixels_y2_mmx2, MM_MMXEXT | PAD },
    { 0, 0 }
};

/*
 * Read the CPU time-stamp counter.
 *
 * Executes the x86 RDTSC instruction, which hands back the 64-bit counter
 * split across EDX (high half) and EAX (low half), and returns both halves
 * joined into a single value.
 *
 * The halves are fetched through separate "=a"/"=d" outputs instead of one
 * "=A" operand: "=A" denotes the EDX:EAX pair on 32-bit targets only, so on
 * x86-64 it would deliver just one of the two registers.
 */
static inline long long rdtsc(void)
{
    unsigned int lo, hi;

    __asm__ __volatile__("rdtsc\n\t"
                         : "=a" (lo), "=d" (hi)
                        );
    return (long long)(((unsigned long long)hi << 32) | lo);
}

/*
 * Time every routine listed in pix_func[] whose required CPU flag is set
 * in the global mm_flags.
 *
 * Each selected routine is called 100000 times on a 16-byte aligned
 * scratch buffer; the time-stamp-counter ticks spent on the whole run are
 * printed next to the routine's label.
 *
 * step: number of bytes the buffer position is advanced after each call.
 *       The position snaps back to the buffer start once it has moved
 *       past 20000 bytes, or in front of the start for a negative step.
 */
static void test_speed(int step)
{
    const struct pix_func* pix;
    const int linesize = 720;
    char empty[32768];
    /* a 16-byte aligned address just inside the scratch buffer */
    char* bu = (char*)(((long)empty + 32) & ~0xf);

    /* advancing in the for-header keeps 'continue' from re-testing the
     * same entry forever */
    for (pix = pix_func; pix->name; pix++)
    {
        op_pixels_func func = pix->func;
        long long offset = 0;
        uint64_t te, ts;
        int i;

        /* skip routines whose instruction set this CPU does not report */
        if (!(pix->mm_flags & mm_flags))
            continue;

        printf("%30s... ", pix->name);
        fflush(stdout);
        ts = rdtsc();
        for (i = 0; i < 100000; i++) {
            char* im = bu + offset;

            func(im, im + 1000, linesize, 16);
            /* track the position as an offset so it can never leave
             * the scratch buffer, whatever the sign of step */
            offset += step;
            if (offset < 0 || offset > 20000)
                offset = 0;
        }
        te = rdtsc();
        /* NOTE(review): emms() is defined in the included sources;
         * presumably it leaves MMX state before the libc calls below */
        emms();
        /* print the full 64-bit tick count rather than truncating to int */
        printf("% 9lld\n", (long long)(te - ts));
        /* PAD marks the last entry of a group: separate groups visually */
        if (pix->mm_flags & PAD)
            puts("");
    }
}

/*
 * Entry point: parse the optional "-s N" / "-step N" argument, report the
 * CPU features returned by mm_support() and run the benchmark.
 *
 * Returns 0 on success, or 1 when the step argument is not a decimal
 * integer in the range 0..20000.
 */
int main(int argc, char* argv[])
{
    int step = 16;

    /* something simple for now: only "-s N" / "-step N" is understood,
     * any other arguments are ignored */
    if (argc > 2 && (strcmp("-s", argv[1]) == 0
                     || strcmp("-step", argv[1]) == 0))
    {
        char* end;
        long value = strtol(argv[2], &end, 10);

        /* test_speed() restarts its buffer position once it has moved
         * past 20000 bytes, so larger steps are pointless and negative
         * ones would point in front of its scratch buffer */
        if (end == argv[2] || *end != '\0' || value < 0 || value > 20000)
        {
            fprintf(stderr, "dsptest: invalid step '%s' (expected 0..20000)\n",
                    argv[2]);
            return 1;
        }
        step = (int)value;
    }

    mm_flags = mm_support();
    printf("dsptest: CPU flags:");
    if (mm_flags & MM_MMX)
        printf(" mmx");
    if (mm_flags & MM_MMXEXT)
        printf(" mmxext");
    if (mm_flags & MM_3DNOW)
        printf(" 3dnow");
    if (mm_flags & MM_SSE)
        printf(" sse");
    if (mm_flags & MM_SSE2)
        printf(" sse2");
    printf("\n");

    printf("Using step: %d\n", step);
    test_speed(step);
    return 0;
}