annotate TOOLS/fastmemcpybench.c @ 15231:e183a591efee

More fixes by The Wanderer
author rtognimp
date Wed, 20 Apr 2005 22:07:08 +0000
parents 40391656ae23
children dd053aeb5442
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
1 /*
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
2 fastmemcpybench.c used to benchmark fastmemcpy.h code from libvo.
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
3
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
4 Note: this code cannot be used on Pentium MMX through PII processors because they contain
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
5 a bug in rdtsc. For Intel processors since P6(PII) rdpmc should be used
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
6 instead. For PIII this is disputable; the bug seems to have been fixed, but I haven't
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
7 tested it.
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
8 */
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
9
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
10 #include <stdio.h>
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
11 #include <stdlib.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
12 #include <string.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
13 #include <sys/ioctl.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
14 #include <unistd.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
15 #include <fcntl.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
16 #include <sys/mman.h>
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
17 #include <sys/time.h>
13839
40391656ae23 small compilation fix
rathann
parents: 3082
diff changeset
18 #include <inttypes.h>
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
19
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
20 #include "../libvo/fastmemcpy.h"
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
21
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
22 //#define ARR_SIZE 100000
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
23 #define ARR_SIZE (1024*768*2)
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
24
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
25 #ifdef HAVE_MGA
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
26
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
27 #include "../drivers/mga_vid.h"
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
28
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
29 static int mga_next_frame=0;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
30
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
31 static mga_vid_config_t mga_vid_config;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
32 static unsigned char* frame=NULL;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
33 static int f;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
34
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
35 static int mga_init(){
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
36 char *frame_mem;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
37
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
38 f = open("/dev/mga_vid",O_RDWR);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
39 if(f == -1)
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
40 {
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
41 fprintf(stderr,"Couldn't open /dev/mga_vid\n");
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
42 return(-1);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
43 }
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
44
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
45 mga_vid_config.num_frames=1;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
46 mga_vid_config.frame_size=ARR_SIZE;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
47 mga_vid_config.format=MGA_VID_FORMAT_YUY2;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
48
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
49 mga_vid_config.colkey_on=0;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
50 mga_vid_config.src_width = 640;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
51 mga_vid_config.src_height= 480;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
52 mga_vid_config.dest_width = 320;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
53 mga_vid_config.dest_height= 200;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
54 mga_vid_config.x_org= 0;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
55 mga_vid_config.y_org= 0;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
56
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
57 mga_vid_config.version=MGA_VID_VERSION;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
58 if (ioctl(f,MGA_VID_CONFIG,&mga_vid_config))
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
59 {
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
60 perror("Error in mga_vid_config ioctl()");
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
61 printf("Your mga_vid driver version is incompatible with this MPlayer version!\n");
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
62 exit(1);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
63 }
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
64 ioctl(f,MGA_VID_ON,0);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
65
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
66 frame = (char*)mmap(0,mga_vid_config.frame_size*mga_vid_config.num_frames,PROT_WRITE,MAP_SHARED,f,0);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
67 if(!frame){
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
68 printf("Can't mmap mga frame\n");
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
69 exit(1);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
70 }
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
71
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
72 //clear the buffer
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
73 //memset(frames[0],0x80,mga_vid_config.frame_size*mga_vid_config.num_frames);
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
74
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
75 return 0;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
76
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
77 }
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
78
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
79 #endif
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
80
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
81 // Returns current time in microseconds
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
/*
 * Returns the current wall-clock time in microseconds, reduced modulo the
 * range of unsigned int. Only differences between two nearby calls are
 * meaningful, since the value wraps around.
 */
unsigned int GetTimer(void){
    struct timeval tv;

    // The timezone argument is obsolete; NULL is the recommended value.
    gettimeofday(&tv,NULL);

    // Multiply in unsigned arithmetic: the wrap-around is then well defined,
    // whereas tv_sec*1000000 in a signed 32-bit long would overflow.
    return (unsigned int)tv.tv_sec*1000000u+(unsigned int)tv.tv_usec;
}
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
90
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
/*
 * Reads the CPU time-stamp counter with the x86 `rdtsc` instruction and
 * returns it as a 64-bit value.
 *
 * rdtsc delivers the low half in EAX and the high half in EDX. The two
 * halves are fetched through separate "=a"/"=d" outputs because the "=A"
 * constraint only denotes the EDX:EAX pair on 32-bit x86; on x86-64 it
 * selects a single register and the upper 32 bits are lost.
 */
static inline unsigned long long int read_tsc( void )
{
    unsigned int lo, hi;
    __asm __volatile ("rdtsc":"=a"(lo),"=d"(hi)::"memory");
    return ((unsigned long long int)hi << 32) | lo;
}
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
97
3076
bfc881c0e591 newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents: 687
diff changeset
98 unsigned char __attribute__((aligned(4096)))arr1[ARR_SIZE],arr2[ARR_SIZE];
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
99
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
100 int main( void )
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
101 {
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
102 unsigned long long int v1,v2;
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
103 unsigned char * marr1,*marr2;
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
104 int i;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
105 unsigned int t;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
106 #ifdef HAVE_MGA
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
107 mga_init();
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
108 marr1 = &frame[3];
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
109 #else
3081
aa361482f2f1 missaligned arrays, as nick requested
michael
parents: 3076
diff changeset
110 marr1 = &arr1[3];
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
111 #endif
3081
aa361482f2f1 missaligned arrays, as nick requested
michael
parents: 3076
diff changeset
112 marr2 = &arr2[9];
3076
bfc881c0e591 newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents: 687
diff changeset
113
3082
michael
parents: 3081
diff changeset
114 for(i=0; i<ARR_SIZE-16; i++) marr1[i] = marr2[i] = i;
3076
bfc881c0e591 newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents: 687
diff changeset
115
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
116 t=GetTimer();
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
117 v1 = read_tsc();
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
118 for(i=0;i<100;i++) memcpy(marr1,marr2,ARR_SIZE-16);
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
119 v2 = read_tsc();
572
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
120 t=GetTimer()-t;
9935c60a15a0 added mga_vid support (systemram->videoram tests)
arpi_esp
parents: 562
diff changeset
121 // ARR_SIZE*100/(1024*1024)/(t/1000000) = ARR_SIZE*95.36743/t
687
bcb46c9eaae1 slight proofreading
nickols_k
parents: 572
diff changeset
122 printf(NAME": cpu clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n",v2-v1,t,100000000.0f/(float)t,(float)ARR_SIZE*95.36743f/(float)t);
562
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
123 return 0;
312fee2a6816 Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff changeset
124 }