annotate libmpcodecs/vf_yvu9.c @ 35584:fb92c6de7f70

Reduce register usage in an asm block. Reduce to 4 registers in an asm block of render_frame_yuv420p_sse4 with simplification of code. After the modification, this function can still be ~3.5x faster than render_frame_yuv420p.
author upsuper
date Fri, 14 Dec 2012 02:16:30 +0000
parents 7af3e6f901fd
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
30421
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
1 /*
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
2 * This file is part of MPlayer.
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
3 *
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
4 * MPlayer is free software; you can redistribute it and/or modify
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
5 * it under the terms of the GNU General Public License as published by
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
6 * the Free Software Foundation; either version 2 of the License, or
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
7 * (at your option) any later version.
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
8 *
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
9 * MPlayer is distributed in the hope that it will be useful,
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
12 * GNU General Public License for more details.
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
13 *
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
14 * You should have received a copy of the GNU General Public License along
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
15 * with MPlayer; if not, write to the Free Software Foundation, Inc.,
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
16 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
17 */
bbb6ebec87a0 Add missing license headers to all files in the libmpcodecs directory.
diego
parents: 29263
diff changeset
18
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
19 #include <stdio.h>
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
20 #include <stdlib.h>
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
21 #include <string.h>
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
22 #include <inttypes.h>
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
23
17012
6ff3379a0862 Unify include path handling, -I.. is in CFLAGS.
diego
parents: 9934
diff changeset
24 #include "config.h"
6ff3379a0862 Unify include path handling, -I.. is in CFLAGS.
diego
parents: 9934
diff changeset
25 #include "mp_msg.h"
18004
bcd805923554 Part2 of several printf2mp_msg changes in patch from Otvos Attila oattila AT chello DOT hu with LOTS of modifications by me
reynaldo
parents: 17906
diff changeset
26 #include "help_mp.h"
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
27
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
28 #include "img_format.h"
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
29 #include "mp_image.h"
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
30 #include "vf.h"
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
31
17012
6ff3379a0862 Unify include path handling, -I.. is in CFLAGS.
diego
parents: 9934
diff changeset
32 #include "libvo/fastmemcpy.h"
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
33
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
34 //===========================================================================//
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
35
30642
a972c1a4a012 cosmetics: Rename struct vf_instance_s --> vf_instance.
diego
parents: 30638
diff changeset
36 static int config(struct vf_instance *vf,
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
37 int width, int height, int d_width, int d_height,
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
38 unsigned int flags, unsigned int outfmt){
29263
0f1b5b68af32 whitespace cosmetics: Remove all trailing whitespace.
diego
parents: 25221
diff changeset
39
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
40 if(vf_next_query_format(vf,IMGFMT_YV12)<=0){
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
41 mp_msg(MSGT_VFILTER, MSGL_WARN, MSGTR_MPCODECS_WarnNextFilterDoesntSupport, "YVU9");
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
42 return 0;
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
43 }
29263
0f1b5b68af32 whitespace cosmetics: Remove all trailing whitespace.
diego
parents: 25221
diff changeset
44
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
45 return vf_next_config(vf,width,height,d_width,d_height,flags,IMGFMT_YV12);
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
46 }
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
47
30642
a972c1a4a012 cosmetics: Rename struct vf_instance_s --> vf_instance.
diego
parents: 30638
diff changeset
48 static int put_image(struct vf_instance *vf, mp_image_t *mpi, double pts){
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
49 mp_image_t *dmpi;
6504
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
50 int y,w,h;
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
51
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
52 // hope we'll get DR buffer:
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
53 dmpi=vf_get_image(vf->next,IMGFMT_YV12,
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
54 MP_IMGTYPE_TEMP, 0/*MP_IMGFLAG_ACCEPT_STRIDE*/,
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
55 mpi->w, mpi->h);
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
56
6504
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
57 for(y=0;y<mpi->h;y++)
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
58 fast_memcpy(dmpi->planes[0]+dmpi->stride[0]*y,
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
59 mpi->planes[0]+mpi->stride[0]*y,
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
60 mpi->w);
6504
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
61
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
62 w=mpi->w/4; h=mpi->h/2;
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
63 for(y=0;y<h;y++){
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
64 unsigned char* s=mpi->planes[1]+mpi->stride[1]*(y>>1);
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
65 unsigned char* d=dmpi->planes[1]+dmpi->stride[1]*y;
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
66 int x;
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
67 for(x=0;x<w;x++) d[2*x]=d[2*x+1]=s[x];
6504
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
68 }
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
69 for(y=0;y<h;y++){
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
70 unsigned char* s=mpi->planes[2]+mpi->stride[2]*(y>>1);
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
71 unsigned char* d=dmpi->planes[2]+dmpi->stride[2]*y;
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
72 int x;
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
73 for(x=0;x<w;x++) d[2*x]=d[2*x+1]=s[x];
6504
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
74 }
11c0ddb83168 use built-in yvu9->yv12 code, because it requires all src/dst strides and
arpi
parents: 6485
diff changeset
75
9934
89da8ec89558 vf_clone_mpi_attributes()
michael
parents: 9593
diff changeset
76 vf_clone_mpi_attributes(dmpi, mpi);
29263
0f1b5b68af32 whitespace cosmetics: Remove all trailing whitespace.
diego
parents: 25221
diff changeset
77
17906
20aca9baf5d8 passing pts through the filter layer (lets see if pts or cola comes out at the end)
michael
parents: 17012
diff changeset
78 return vf_next_put_image(vf,dmpi, pts);
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
79 }
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
80
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
81 //===========================================================================//
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
82
30642
a972c1a4a012 cosmetics: Rename struct vf_instance_s --> vf_instance.
diego
parents: 30638
diff changeset
83 static int query_format(struct vf_instance *vf, unsigned int fmt){
6524
05cd2cf758e4 if09 support
alex
parents: 6504
diff changeset
84 if (fmt == IMGFMT_YVU9 || fmt == IMGFMT_IF09)
32702
7af3e6f901fd Convert some tabs to whitespace to allow using MPlayer filter sourcecode in FFmpeg.
cehoyos
parents: 30642
diff changeset
85 return vf_next_query_format(vf,IMGFMT_YV12) & (~VFCAP_CSP_SUPPORTED_BY_HW);
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
86 return 0;
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
87 }
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
88
30638
a7b908875c14 Rename open() vf initialization function to vf_open().
diego
parents: 30421
diff changeset
89 static int vf_open(vf_instance_t *vf, char *args){
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
90 vf->config=config;
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
91 vf->put_image=put_image;
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
92 vf->query_format=query_format;
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
93 return 1;
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
94 }
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
95
25221
00fff9a3b735 Make all vf_info_t structs const
reimar
parents: 23457
diff changeset
96 const vf_info_t vf_info_yvu9 = {
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
97 "fast YVU9->YV12 conversion",
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
98 "yvu9",
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
99 "alex",
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
100 "",
30638
a7b908875c14 Rename open() vf initialization function to vf_open().
diego
parents: 30421
diff changeset
101 vf_open,
9593
e9a2af584986 Add the new -vf option wich is the same as vop in reverse order.
albeu
parents: 7368
diff changeset
102 NULL
6485
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
103 };
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
104
52563321dc78 yvu9toyv12 converter
alex
parents:
diff changeset
105 //===========================================================================//