annotate TOOLS/fastmemcpybench.c @ 28894:b29169fccda9

Fix and restructure fastmemcpybench. It is now one binary that runs all available memcpy variants and prints benchmark results about them.
author diego
date Tue, 10 Mar 2009 10:05:09 +0000
parents 5643b5e6bee0
children 1d34931ae1e6
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
1 /*
28869
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
2 * benchmark tool for fast_memcpy code from libvo
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
3 *
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
4 * NOTE: This code cannot be used on Pentium MMX / II because they contain
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
5 * a bug in rdtsc. For Intel processors since P6(PII) rdpmc should be used
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
6 * instead. For PIII it's disputable and it seems the bug was fixed but this
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
7 * was not confirmed through testing.
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
8 */
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
9
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
10 #include <stdio.h>
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
11 #include <stdlib.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
12 #include <string.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
13 #include <sys/ioctl.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
14 #include <unistd.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
15 #include <fcntl.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
16 #include <sys/mman.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
17 #include <sys/time.h>
13839
40391656ae23 small compilation fix
rathann
parents: 3082
diff changeset
18 #include <inttypes.h>
28894
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
19
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
20 #include "config.h"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
21 #include "cpudetect.h"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
22
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
23 #define BLOCK_SIZE 4096
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
24 #define CONFUSION_FACTOR 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
25
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
26 #if HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
27 #define COMPILE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
28 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
29
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
30 #if HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
31 #define COMPILE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
32 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
33
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
34 #if HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
35 #define COMPILE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
36 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
37
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
38 #if HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
39 #define COMPILE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
40 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
41
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
42 #ifdef COMPILE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
43 #undef RENAME
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
44 #undef HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
45 #undef HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
46 #undef HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
47 #undef HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
48 #undef HAVE_SSE2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
49 #define HAVE_MMX 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
50 #define HAVE_MMX2 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
51 #define HAVE_AMD3DNOW 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
52 #define HAVE_SSE 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
53 #define HAVE_SSE2 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
54 #define RENAME(a) a ## _MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
55 #include "libvo/aclib_template.c"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
56 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
57
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
58 #ifdef COMPILE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
59 #undef RENAME
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
60 #undef HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
61 #undef HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
62 #undef HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
63 #undef HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
64 #undef HAVE_SSE2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
65 #define HAVE_MMX 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
66 #define HAVE_MMX2 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
67 #define HAVE_AMD3DNOW 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
68 #define HAVE_SSE 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
69 #define HAVE_SSE2 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
70 #define RENAME(a) a ## _MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
71 #include "libvo/aclib_template.c"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
72 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
73
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
74 #ifdef COMPILE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
75 #undef RENAME
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
76 #undef HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
77 #undef HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
78 #undef HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
79 #undef HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
80 #undef HAVE_SSE2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
81 #define HAVE_MMX 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
82 #define HAVE_MMX2 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
83 #define HAVE_AMD3DNOW 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
84 #define HAVE_SSE 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
85 #define HAVE_SSE2 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
86 #define RENAME(a) a ## _3DNow
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
87 #include "libvo/aclib_template.c"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
88 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
89
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
90 #ifdef COMPILE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
91 #undef RENAME
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
92 #undef HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
93 #undef HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
94 #undef HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
95 #undef HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
96 #undef HAVE_SSE2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
97 #define HAVE_MMX 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
98 #define HAVE_MMX2 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
99 #define HAVE_AMD3DNOW 0
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
100 #define HAVE_SSE 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
101 #define HAVE_SSE2 1
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
102 #define RENAME(a) a ## _SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
103 #include "libvo/aclib_template.c"
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
104 #endif
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
105
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
106 //#define ARR_SIZE 100000
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
107 #define ARR_SIZE (1024*768*2)
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
108
27365
13c920fdf7f5 Change a bunch of video-output-specific preprocessor directives from a HAVE_
diego
parents: 26759
diff changeset
109 #ifdef CONFIG_MGA
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
110
17017
dd053aeb5442 Unify include path handling by using -I.
diego
parents: 13839
diff changeset
111 #include "drivers/mga_vid.h"
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
112
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
113 static mga_vid_config_t mga_vid_config;
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
114 static unsigned char* frame = NULL;
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
115 static int f;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
116
28232
8df85ad26746 Add missing 'void' keyword to parameterless function declarations.
diego
parents: 27757
diff changeset
117 static int mga_init(void)
8df85ad26746 Add missing 'void' keyword to parameterless function declarations.
diego
parents: 27757
diff changeset
118 {
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
119 f = open("/dev/mga_vid", O_RDWR);
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
120 if (f == -1) {
28869
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
121 fprintf(stderr, "Couldn't open /dev/mga_vid.\n");
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
122 return -1;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
123 }
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
124
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
125 mga_vid_config.num_frames = 1;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
126 mga_vid_config.frame_size = ARR_SIZE;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
127 mga_vid_config.format = MGA_VID_FORMAT_YUY2;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
128
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
129 mga_vid_config.colkey_on = 0;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
130 mga_vid_config.src_width = 640;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
131 mga_vid_config.src_height = 480;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
132 mga_vid_config.dest_width = 320;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
133 mga_vid_config.dest_height = 200;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
134 mga_vid_config.x_org = 0;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
135 mga_vid_config.y_org = 0;
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
136
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
137 mga_vid_config.version = MGA_VID_VERSION;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
138 if (ioctl(f, MGA_VID_CONFIG, &mga_vid_config)) {
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
139 perror("Error in mga_vid_config ioctl()");
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
140 printf("Your mga_vid driver version is incompatible with this MPlayer version!\n");
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
141 exit(1);
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
142 }
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
143 ioctl(f, MGA_VID_ON, 0);
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
144
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
145 frame = (char*)mmap(0, mga_vid_config.frame_size*mga_vid_config.num_frames,
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
146 PROT_WRITE,MAP_SHARED, f, 0);
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
147 if (!frame) {
28869
04a232eb5f0d comment/output cosmetics
diego
parents: 28868
diff changeset
148 printf("Can't mmap MGA frame.\n");
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
149 exit(1);
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
150 }
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
151
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
152 //clear the buffer
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
153 //memset(frames[0], 0x80, mga_vid_config.frame_size*mga_vid_config.num_frames);
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
154
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
155 return 0;
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
156 }
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
157
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
158 #endif
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
159
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
160 // Returns the current time in microseconds, truncated to unsigned int (wraps about every 71.6 minutes if unsigned int is 32 bits)
28232
8df85ad26746 Add missing 'void' keyword to parameterless function declarations.
diego
parents: 27757
diff changeset
161 static unsigned int GetTimer(void)
8df85ad26746 Add missing 'void' keyword to parameterless function declarations.
diego
parents: 27757
diff changeset
162 {
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
163 struct timeval tv;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
164 struct timezone tz;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
165 //float s;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
166 gettimeofday(&tv, &tz);
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
167 //s = tv.tv_usec; s *= 0.000001; s += tv.tv_sec;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
168 return tv.tv_sec * 1000000 + tv.tv_usec;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
169 }
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
170
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
171 static inline unsigned long long int read_tsc(void)
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
172 {
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
173 unsigned long long int retval;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
174 __asm__ volatile ("rdtsc":"=A" (retval)::"memory");
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
175 return retval;
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
176 }
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
177
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
178 unsigned char __attribute__((aligned(4096)))arr1[ARR_SIZE], arr2[ARR_SIZE];
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
179
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
180 int main(void)
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
181 {
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
182 unsigned long long int v1, v2;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
183 unsigned char *marr1, *marr2;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
184 int i;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
185 unsigned int t;
27365
13c920fdf7f5 Change a bunch of video-output-specific preprocessor directives from a HAVE_
diego
parents: 26759
diff changeset
186 #ifdef CONFIG_MGA
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
187 mga_init();
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
188 marr1 = &frame[3];
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
189 #else
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
190 marr1 = &arr1[0];
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
191 #endif
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
192 marr2 = &arr2[0];
3076
bfc881c0e591 newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents: 687
diff changeset
193
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
194 for (i = 0; i < ARR_SIZE - 16; i++)
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
195 marr1[i] = marr2[i] = i;
3076
bfc881c0e591 newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents: 687
diff changeset
196
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
197 t = GetTimer();
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
198 v1 = read_tsc();
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
199 for (i = 0; i < 100; i++)
28894
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
200 memcpy(marr1, marr2, ARR_SIZE - 16);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
201 v2 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
202 t = GetTimer() - t;
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
203 // MB/s: ARR_SIZE*100 bytes / (1024*1024) / (t/1000000 s) = ARR_SIZE*95.36743 / t  (t in microseconds)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
204 printf("libc: CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t,
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
205 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
206
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
207 #if HAVE_MMX
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
208 t = GetTimer();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
209 v1 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
210 for (i = 0; i < 100; i++)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
211 fast_memcpy_MMX(marr1, marr2, ARR_SIZE - 16);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
212 v2 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
213 t = GetTimer() - t;
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
214 // MB/s: ARR_SIZE*100 bytes / (1024*1024) / (t/1000000 s) = ARR_SIZE*95.36743 / t  (t in microseconds)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
215 printf("MMX: CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t,
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
216 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
217 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
218
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
219 #if HAVE_AMD3DNOW
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
220 t = GetTimer();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
221 v1 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
222 for (i = 0; i < 100; i++)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
223 fast_memcpy_3DNow(marr1, marr2, ARR_SIZE - 16);
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
224 v2 = read_tsc();
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
225 t = GetTimer() - t;
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
226 // MB/s: ARR_SIZE*100 bytes / (1024*1024) / (t/1000000 s) = ARR_SIZE*95.36743 / t  (t in microseconds)
28894
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
227 printf("3DNow!: CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t,
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
228 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
229 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
230
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
231 #if HAVE_MMX2
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
232 t = GetTimer();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
233 v1 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
234 for (i = 0; i < 100; i++)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
235 fast_memcpy_MMX2(marr1, marr2, ARR_SIZE - 16);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
236 v2 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
237 t = GetTimer() - t;
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
238 // MB/s: ARR_SIZE*100 bytes / (1024*1024) / (t/1000000 s) = ARR_SIZE*95.36743 / t  (t in microseconds)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
239 printf("MMX2: CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t,
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
240 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t);
28894
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
241 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
242
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
243 #if HAVE_SSE
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
244 t = GetTimer();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
245 v1 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
246 for (i = 0; i < 100; i++)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
247 fast_memcpy_SSE(marr1, marr2, ARR_SIZE - 16);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
248 v2 = read_tsc();
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
249 t = GetTimer() - t;
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
250 // MB/s: ARR_SIZE*100 bytes / (1024*1024) / (t/1000000 s) = ARR_SIZE*95.36743 / t  (t in microseconds)
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
251 printf("SSE: CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t,
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
252 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t);
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
253 #endif
b29169fccda9 Fix and restructure fastmemcpybench. It is now one binary that runs all
diego
parents: 28871
diff changeset
254
28868
a10ddae3de31 whitespace cosmetics:
diego
parents: 28855
diff changeset
255 return 0;
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
256 }