Mercurial > mplayer.hg
annotate TOOLS/fastmemcpybench.c @ 28457:7d49f24cc18f
Drop the deprecated sws_scale_ordered() at the next major version
bump.
author | stefano |
---|---|
date | Sun, 08 Feb 2009 23:06:05 +0000 |
parents | 8df85ad26746 |
children | 07c168210a73 |
rev | line source |
---|---|
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
1 /* |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
2 fastmemcpybench.c used to benchmark fastmemcpy.h code from libvo. |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
3 |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
4 Note: this code can not be used on PentMMX-PII because they contain |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
5 a bug in rdtsc. For Intel processors since P6(PII) rdpmc should be used |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
6 instead. For PIII it's disputable and seems bug was fixed but I don't |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
7 tested it. |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
8 */ |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
9 |
28232
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
10 /* According to Uoti this code is broken. */ |
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
11 |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
12 #include <stdio.h> |
572 | 13 #include <stdlib.h> |
14 #include <string.h> | |
15 #include <sys/ioctl.h> | |
16 #include <unistd.h> | |
17 #include <fcntl.h> | |
18 #include <sys/mman.h> | |
19 #include <sys/time.h> | |
13839 | 20 #include <inttypes.h> |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
21 |
572 | 22 //#define ARR_SIZE 100000 |
23 #define ARR_SIZE (1024*768*2) | |
24 | |
27365
13c920fdf7f5
Change a bunch of video-output-specific preprocessor directives from a HAVE_
diego
parents:
26759
diff
changeset
|
25 #ifdef CONFIG_MGA |
572 | 26 |
17017 | 27 #include "drivers/mga_vid.h" |
572 | 28 |
29 static mga_vid_config_t mga_vid_config; | |
30 static unsigned char* frame=NULL; | |
31 static int f; | |
32 | |
28232
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
33 static int mga_init(void) |
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
34 { |
572 | 35 f = open("/dev/mga_vid",O_RDWR); |
36 if(f == -1) | |
37 { | |
38 fprintf(stderr,"Couldn't open /dev/mga_vid\n"); | |
26759
8eff880f638c
cosmetics: Remove useless parentheses from return statements.
diego
parents:
26575
diff
changeset
|
39 return -1; |
572 | 40 } |
41 | |
42 mga_vid_config.num_frames=1; | |
43 mga_vid_config.frame_size=ARR_SIZE; | |
44 mga_vid_config.format=MGA_VID_FORMAT_YUY2; | |
45 | |
46 mga_vid_config.colkey_on=0; | |
47 mga_vid_config.src_width = 640; | |
48 mga_vid_config.src_height= 480; | |
49 mga_vid_config.dest_width = 320; | |
50 mga_vid_config.dest_height= 200; | |
51 mga_vid_config.x_org= 0; | |
52 mga_vid_config.y_org= 0; | |
53 | |
54 mga_vid_config.version=MGA_VID_VERSION; | |
55 if (ioctl(f,MGA_VID_CONFIG,&mga_vid_config)) | |
56 { | |
57 perror("Error in mga_vid_config ioctl()"); | |
58 printf("Your mga_vid driver version is incompatible with this MPlayer version!\n"); | |
59 exit(1); | |
60 } | |
61 ioctl(f,MGA_VID_ON,0); | |
62 | |
63 frame = (char*)mmap(0,mga_vid_config.frame_size*mga_vid_config.num_frames,PROT_WRITE,MAP_SHARED,f,0); | |
64 if(!frame){ | |
65 printf("Can't mmap mga frame\n"); | |
66 exit(1); | |
67 } | |
68 | |
69 //clear the buffer | |
70 //memset(frames[0],0x80,mga_vid_config.frame_size*mga_vid_config.num_frames); | |
71 | |
72 return 0; | |
73 | |
74 } | |
75 | |
76 #endif | |
77 | |
78 // Returns current time in microseconds | |
28232
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
79 static unsigned int GetTimer(void) |
8df85ad26746
Add missing 'void' keyword to parameterless function declarations.
diego
parents:
27757
diff
changeset
|
80 { |
572 | 81 struct timeval tv; |
82 struct timezone tz; | |
83 // float s; | |
84 gettimeofday(&tv,&tz); | |
85 // s=tv.tv_usec;s*=0.000001;s+=tv.tv_sec; | |
26759
8eff880f638c
cosmetics: Remove useless parentheses from return statements.
diego
parents:
26575
diff
changeset
|
86 return tv.tv_sec * 1000000 + tv.tv_usec; |
572 | 87 } |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
88 |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
89 static inline unsigned long long int read_tsc( void ) |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
90 { |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
91 unsigned long long int retval; |
27757
b5a46071062a
Replace all occurrences of '__volatile__' and '__volatile' by plain 'volatile'.
diego
parents:
27754
diff
changeset
|
92 __asm__ volatile ("rdtsc":"=A"(retval)::"memory"); |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
93 return retval; |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
94 } |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
95 |
3076
bfc881c0e591
newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents:
687
diff
changeset
|
96 unsigned char __attribute__((aligned(4096)))arr1[ARR_SIZE],arr2[ARR_SIZE]; |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
97 |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
98 int main( void ) |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
99 { |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
100 unsigned long long int v1,v2; |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
101 unsigned char * marr1,*marr2; |
572 | 102 int i; |
103 unsigned int t; | |
27365
13c920fdf7f5
Change a bunch of video-output-specific preprocessor directives from a HAVE_
diego
parents:
26759
diff
changeset
|
104 #ifdef CONFIG_MGA |
572 | 105 mga_init(); |
106 marr1 = &frame[3]; | |
107 #else | |
3081 | 108 marr1 = &arr1[3]; |
572 | 109 #endif |
3081 | 110 marr2 = &arr2[9]; |
3076
bfc881c0e591
newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents:
687
diff
changeset
|
111 |
3082 | 112 for(i=0; i<ARR_SIZE-16; i++) marr1[i] = marr2[i] = i; |
3076
bfc881c0e591
newly allocated memory seems to point to only 1 zero filled 4k page or something so there is a near 100% cache hit rate ... not very realistic, writeing something in the source array fixes that so the benchmark scores are meaningfull now
michael
parents:
687
diff
changeset
|
113 |
572 | 114 t=GetTimer(); |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
115 v1 = read_tsc(); |
572 | 116 for(i=0;i<100;i++) memcpy(marr1,marr2,ARR_SIZE-16); |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
117 v2 = read_tsc(); |
572 | 118 t=GetTimer()-t; |
119 // ARR_SIZE*100/(1024*1024)/(t/1000000) = ARR_SIZE*95.36743/t | |
687 | 120 printf(NAME": cpu clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n",v2-v1,t,100000000.0f/(float)t,(float)ARR_SIZE*95.36743f/(float)t); |
562
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
121 return 0; |
312fee2a6816
Initial release, used to benchmark fastmemcpy.h code from libvo.
atmosfear
parents:
diff
changeset
|
122 } |