Mercurial > mplayer.hg
view TOOLS/fastmemcpybench.c @ 28871:5643b5e6bee0
Make fastmemcpybench almost working - only thing missing is a way to
override HAVE_MMX etc. from config.h.
author | reimar |
---|---|
date | Mon, 09 Mar 2009 12:59:14 +0000 |
parents | 04a232eb5f0d |
children | b29169fccda9 |
line wrap: on
line source
/* * benchmark tool for fast_memcpy code from libvo * * NOTE: This code can not be used on Pentium MMX / II because they contain * a bug in rdtsc. For Intel processors since P6(PII) rdpmc should be used * instead. For PIII it's disputable and it seems the bug was fixed but this * was not confirmed through testing. */ /* According to Uoti this code is broken. */ #include <stdio.h> #include <stdlib.h> #include <string.h> #include <sys/ioctl.h> #include <unistd.h> #include <fcntl.h> #include <sys/mman.h> #include <sys/time.h> #include <inttypes.h> #include "libvo/fastmemcpy.h" //#define ARR_SIZE 100000 #define ARR_SIZE (1024*768*2) #ifdef CONFIG_MGA #include "drivers/mga_vid.h" static mga_vid_config_t mga_vid_config; static unsigned char* frame = NULL; static int f; static int mga_init(void) { f = open("/dev/mga_vid", O_RDWR); if (f == -1) { fprintf(stderr, "Couldn't open /dev/mga_vid.\n"); return -1; } mga_vid_config.num_frames = 1; mga_vid_config.frame_size = ARR_SIZE; mga_vid_config.format = MGA_VID_FORMAT_YUY2; mga_vid_config.colkey_on = 0; mga_vid_config.src_width = 640; mga_vid_config.src_height = 480; mga_vid_config.dest_width = 320; mga_vid_config.dest_height = 200; mga_vid_config.x_org = 0; mga_vid_config.y_org = 0; mga_vid_config.version = MGA_VID_VERSION; if (ioctl(f, MGA_VID_CONFIG, &mga_vid_config)) { perror("Error in mga_vid_config ioctl()"); printf("Your mga_vid driver version is incompatible with this MPlayer version!\n"); exit(1); } ioctl(f, MGA_VID_ON, 0); frame = (char*)mmap(0, mga_vid_config.frame_size*mga_vid_config.num_frames, PROT_WRITE,MAP_SHARED, f, 0); if (!frame) { printf("Can't mmap MGA frame.\n"); exit(1); } //clear the buffer //memset(frames[0], 0x80, mga_vid_config.frame_size*mga_vid_config.num_frames); return 0; } #endif // Returns current time in microseconds static unsigned int GetTimer(void) { struct timeval tv; struct timezone tz; //float s; gettimeofday(&tv, &tz); //s = tv.tv_usec; s *= 0.000001; s += tv.tv_sec; return tv.tv_sec * 1000000 + tv.tv_usec; } static inline unsigned long long int read_tsc(void) { unsigned long long int retval; __asm__ volatile ("rdtsc":"=A" (retval)::"memory"); return retval; } unsigned char __attribute__((aligned(4096)))arr1[ARR_SIZE], arr2[ARR_SIZE]; int main(void) { unsigned long long int v1, v2; unsigned char *marr1, *marr2; int i; unsigned int t; #ifdef CONFIG_MGA mga_init(); marr1 = &frame[3]; #else marr1 = &arr1[0]; #endif marr2 = &arr2[0]; for (i = 0; i < ARR_SIZE - 16; i++) marr1[i] = marr2[i] = i; t = GetTimer(); v1 = read_tsc(); for (i = 0; i < 100; i++) fast_memcpy(marr1, marr2, ARR_SIZE - 16); v2 = read_tsc(); t = GetTimer() - t; // ARR_SIZE*100 / (1024*1024) / (t/1000000) = ARR_SIZE*95.36743 / t printf(NAME ": CPU clocks=%llu = %dus (%5.3ffps) %5.1fMB/s\n", v2-v1, t, 100000000.0f/(float)t, (float)ARR_SIZE*95.36743f/(float)t); return 0; }