comparison libmpcodecs/ae_lame.c @ 15234:e84a6ae9d51e

audio encoding reworked
author nicodvb
date Fri, 22 Apr 2005 06:59:59 +0000
parents
children 2cc48c37a7eb
comparison
equal deleted inserted replaced
15233:e18a07d6badb 15234:e84a6ae9d51e
1 #include <stdio.h>
2 #include <stdlib.h>
3 #include <inttypes.h>
4 #include <string.h>
5 #include "m_option.h"
6 #include "../mp_msg.h"
7 #include "aviheader.h"
8 #include "ms_hdr.h"
9 #include "muxer.h"
10 #include "../help_mp.h"
11 #include "ae_pcm.h"
12 #include "../libaf/af_format.h"
13 #include "../libmpdemux/mp3_hdr.h"
14
15 #undef CDECL
16 #include <lame/lame.h>
17
18 lame_global_flags *lame;
19 static int lame_param_quality=0; // best
20 static int lame_param_algqual=5; // same as old default
21 static int lame_param_vbr=vbr_default;
22 static int lame_param_mode=-1; // unset
23 static int lame_param_padding=-1; // unset
24 static int lame_param_br=-1; // unset
25 static int lame_param_ratio=-1; // unset
26 static float lame_param_scale=-1; // unset
27 static int lame_param_lowpassfreq = 0; //auto
28 static int lame_param_highpassfreq = 0; //auto
29 static int lame_param_free_format = 0; //disabled
30 static int lame_param_br_min = 0; //not specified
31 static int lame_param_br_max = 0; //not specified
32
33 #if HAVE_MP3LAME >= 392
34 int lame_param_fast=0; // unset
35 static char* lame_param_preset=NULL; // unset
36 static int lame_presets_set( lame_t gfp, int fast, int cbr, const char* preset_name );
37 static void lame_presets_longinfo_dm ( FILE* msgfp );
38 #endif
39
40
41 m_option_t lameopts_conf[]={
42 {"q", &lame_param_quality, CONF_TYPE_INT, CONF_RANGE, 0, 9, NULL},
43 {"aq", &lame_param_algqual, CONF_TYPE_INT, CONF_RANGE, 0, 9, NULL},
44 {"vbr", &lame_param_vbr, CONF_TYPE_INT, CONF_RANGE, 0, vbr_max_indicator, NULL},
45 {"cbr", &lame_param_vbr, CONF_TYPE_FLAG, 0, 0, 0, NULL},
46 {"abr", &lame_param_vbr, CONF_TYPE_FLAG, 0, 0, vbr_abr, NULL},
47 {"mode", &lame_param_mode, CONF_TYPE_INT, CONF_RANGE, 0, MAX_INDICATOR, NULL},
48 {"padding", &lame_param_padding, CONF_TYPE_INT, CONF_RANGE, 0, PAD_MAX_INDICATOR, NULL},
49 {"br", &lame_param_br, CONF_TYPE_INT, CONF_RANGE, 0, 1024, NULL},
50 {"ratio", &lame_param_ratio, CONF_TYPE_INT, CONF_RANGE, 0, 100, NULL},
51 {"vol", &lame_param_scale, CONF_TYPE_FLOAT, CONF_RANGE, 0, 10, NULL},
52 {"lowpassfreq",&lame_param_lowpassfreq, CONF_TYPE_INT, CONF_RANGE, -1, 48000,0},
53 {"highpassfreq",&lame_param_highpassfreq, CONF_TYPE_INT, CONF_RANGE, -1, 48000,0},
54 {"nofree", &lame_param_free_format, CONF_TYPE_FLAG, 0, 0, 0, NULL},
55 {"free", &lame_param_free_format, CONF_TYPE_FLAG, 0, 0, 1, NULL},
56 {"br_min", &lame_param_br_min, CONF_TYPE_INT, CONF_RANGE, 0, 1024, NULL},
57 {"br_max", &lame_param_br_max, CONF_TYPE_INT, CONF_RANGE, 0, 1024, NULL},
58 #if HAVE_MP3LAME >= 392
59 {"fast", &lame_param_fast, CONF_TYPE_FLAG, 0, 0, 1, NULL},
60 {"preset", &lame_param_preset, CONF_TYPE_STRING, 0, 0, 0, NULL},
61 #else
62 {"fast", "MPlayer was built without -lameopts fast support (requires libmp3lame >=3.92).\n", CONF_TYPE_PRINT, CONF_NOCFG, 0, 0, NULL},
63 {"preset", "MPlayer was built without -lameopts preset support (requires libmp3lame >=3.92).\n", CONF_TYPE_PRINT, CONF_NOCFG, 0, 0, NULL},
64 #endif
65 {"help", MSGTR_MEncoderMP3LameHelp, CONF_TYPE_PRINT, CONF_NOCFG, 0, 0, NULL},
66 {NULL, NULL, 0, 0, 0, 0, NULL}
67 };
68
69
/* Not referenced by any code visible in this file. */
static int pass;

/* Verbosity level defined elsewhere; values above 0 make mpae_init_lame() dump the LAME configuration. */
extern int verbose;
72
73 static int bind_lame(audio_encoder_t *encoder, muxer_stream_t *mux_a)
74 {
75 mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_MP3AudioSelected);
76 mux_a->h.dwSampleSize=0; // VBR
77 mux_a->h.dwRate=encoder->params.sample_rate;
78 mux_a->h.dwScale=encoder->params.samples_per_frame; // samples/frame
79 if(sizeof(MPEGLAYER3WAVEFORMAT)!=30) mp_msg(MSGT_MENCODER,MSGL_WARN,MSGTR_MP3WaveFormatSizeNot30,sizeof(MPEGLAYER3WAVEFORMAT));
80 mux_a->wf=malloc(sizeof(MPEGLAYER3WAVEFORMAT)); // should be 30
81 mux_a->wf->wFormatTag=0x55; // MP3
82 mux_a->wf->nChannels= (lame_param_mode<0) ? encoder->params.channels : ((lame_param_mode==3) ? 1 : 2);
83 mux_a->wf->nSamplesPerSec=mux_a->h.dwRate;
84 if(! lame_param_vbr)
85 mux_a->wf->nAvgBytesPerSec=lame_param_br * 125;
86 else
87 mux_a->wf->nAvgBytesPerSec=192000/8; // FIXME!
88 mux_a->wf->nBlockAlign=encoder->params.samples_per_frame; // required for l3codeca.acm + WMP 6.4
89 mux_a->wf->wBitsPerSample=0; //16;
90 // from NaNdub: (requires for l3codeca.acm)
91 mux_a->wf->cbSize=12;
92 ((MPEGLAYER3WAVEFORMAT*)(mux_a->wf))->wID=1;
93 ((MPEGLAYER3WAVEFORMAT*)(mux_a->wf))->fdwFlags=2;
94 ((MPEGLAYER3WAVEFORMAT*)(mux_a->wf))->nBlockSize=encoder->params.samples_per_frame; // ???
95 ((MPEGLAYER3WAVEFORMAT*)(mux_a->wf))->nFramesPerBlock=1;
96 ((MPEGLAYER3WAVEFORMAT*)(mux_a->wf))->nCodecDelay=0;
97
98 encoder->input_format = AF_FORMAT_S16_LE;
99 encoder->min_buffer_size = 4608;
100 encoder->max_buffer_size = mux_a->h.dwRate * mux_a->wf->nChannels * 2;
101
102 return 1;
103 }
104
105 #define min(a, b) ((a) <= (b) ? (a) : (b))
106
107 static int get_frame_size(audio_encoder_t *encoder)
108 {
109 int sz;
110 if(encoder->stream->buffer_len < 4)
111 return 0;
112 sz = mp_decode_mp3_header(encoder->stream->buffer);
113 if(sz <= 0)
114 return 0;
115 return sz;
116 }
117
118 static int encode_lame(audio_encoder_t *encoder, uint8_t *dest, void *src, int len, int max_size)
119 {
120 int n = 0;
121 if(encoder->params.channels == 1)
122 n = lame_encode_buffer(lame, (short *)src, (short *)src, len/2, dest, max_size);
123 else
124 n = lame_encode_buffer_interleaved(lame,(short *)src, len/4, dest, max_size);
125
126 return (n < 0 ? 0 : n);
127 }
128
129
130 static int close_lame(audio_encoder_t *encoder)
131 {
132 return 1;
133 }
134
135 static void fixup(audio_encoder_t *encoder)
136 {
137 // fixup CBR mp3 audio header:
138 if(!lame_param_vbr) {
139 encoder->stream->h.dwSampleSize=1;
140 ((MPEGLAYER3WAVEFORMAT*)(encoder->stream->wf))->nBlockSize=
141 (encoder->stream->size+(encoder->stream->h.dwLength>>1))/encoder->stream->h.dwLength;
142 encoder->stream->h.dwLength=encoder->stream->size;
143 encoder->stream->h.dwRate=encoder->stream->wf->nAvgBytesPerSec;
144 encoder->stream->h.dwScale=1;
145 encoder->stream->wf->nBlockAlign=1;
146 mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_CBRAudioByterate,
147 encoder->stream->h.dwRate,((MPEGLAYER3WAVEFORMAT*)(encoder->stream->wf))->nBlockSize);
148 }
149 }
150
151 int mpae_init_lame(audio_encoder_t *encoder)
152 {
153 encoder->params.bitrate = lame_param_br * 125;
154 encoder->params.samples_per_frame = encoder->params.sample_rate < 32000 ? 576 : 1152;
155 encoder->decode_buffer_size = 2304;
156
157 lame=lame_init();
158 lame_set_bWriteVbrTag(lame,0);
159 lame_set_in_samplerate(lame,encoder->params.sample_rate);
160 //lame_set_in_samplerate(lame,sh_audio->samplerate); // if resampling done by lame
161 lame_set_num_channels(lame,encoder->params.channels);
162 lame_set_out_samplerate(lame,encoder->params.sample_rate);
163 lame_set_quality(lame,lame_param_algqual); // 0 = best q
164 if(lame_param_free_format) lame_set_free_format(lame,1);
165 if(lame_param_vbr){ // VBR:
166 lame_set_VBR(lame,lame_param_vbr); // vbr mode
167 lame_set_VBR_q(lame,lame_param_quality); // 0 = best vbr q 5=~128k
168 if(lame_param_br>0) lame_set_VBR_mean_bitrate_kbps(lame,lame_param_br);
169 if(lame_param_br_min>0) lame_set_VBR_min_bitrate_kbps(lame,lame_param_br_min);
170 if(lame_param_br_max>0) lame_set_VBR_max_bitrate_kbps(lame,lame_param_br_max);
171 } else { // CBR:
172 if(lame_param_br>0) lame_set_brate(lame,lame_param_br);
173 }
174 if(lame_param_mode>=0) lame_set_mode(lame,lame_param_mode); // j-st
175 if(lame_param_ratio>0) lame_set_compression_ratio(lame,lame_param_ratio);
176 if(lame_param_scale>0) {
177 mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_SettingAudioInputGain, lame_param_scale);
178 lame_set_scale(lame,lame_param_scale);
179 }
180 if(lame_param_lowpassfreq>=-1) lame_set_lowpassfreq(lame,lame_param_lowpassfreq);
181 if(lame_param_highpassfreq>=-1) lame_set_highpassfreq(lame,lame_param_highpassfreq);
182 #if HAVE_MP3LAME >= 392
183 if(lame_param_preset != NULL) {
184 mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_LamePresetEquals,lame_param_preset);
185 if(lame_presets_set(lame,lame_param_fast, (lame_param_vbr==0), lame_param_preset) < 0)
186 return 0;
187 }
188 #endif
189 if(lame_init_params(lame) == -1) {
190 mp_msg(MSGT_MENCODER, MSGL_FATAL, MSGTR_LameCantInit);
191 return 0;
192 }
193 if(verbose>0) {
194 lame_print_config(lame);
195 lame_print_internals(lame);
196 }
197
198 encoder->bind = bind_lame;
199 encoder->get_frame_size = get_frame_size;
200 encoder->encode = encode_lame;
201 encoder->fixup = fixup;
202 encoder->close = close_lame;
203 return 1;
204 }
205
#if HAVE_MP3LAME >= 392
/* lame_presets_set
   taken out of presets_set in lame-3.93.1/frontend/parse.c and modified

   Applies the preset called preset_name to gfp.
     fast - values above 0 select the *_FAST variant of the named presets
            and disable "insane"/"320" and the numeric presets
     cbr  - 1 switches VBR off after a numeric preset has been applied
   Returns 0 when a preset was applied, -1 when preset_name is "help" or
   when the preset name/bitrate is not accepted. */
static int lame_presets_set( lame_t gfp, int fast, int cbr, const char* preset_name )
{
    /* legacy preset names, mapped to the bitrate string that replaces them */
    static const struct {
        const char *alias;
        const char *bitrate;
        int         mono;
    } legacy[] = {
        { "phone",  "16",  1 },
        { "phon+",  "24",  1 },
        { "lw",     "24",  1 },
        { "mw-eu",  "24",  1 },
        { "sw",     "24",  1 },
        { "mw-us",  "40",  1 },
        { "voice",  "56",  1 },
        { "fm",     "112", 0 },
        { "radio",  "112", 0 },
        { "tape",   "112", 0 },
        { "hifi",   "160", 0 },
        { "cd",     "192", 0 },
        { "studio", "256", 0 },
    };
    const int want_fast = (fast > 0);
    int mono = 0;
    int kbps;
    unsigned i;

    if (!strcmp(preset_name, "help")) {
        mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_LameVersion, get_lame_version(), get_lame_url());
        lame_presets_longinfo_dm(stderr);
        return -1;
    }

    /* aliases for compatibility with old presets */
    for (i = 0; i < sizeof(legacy) / sizeof(legacy[0]); i++) {
        if (!strcmp(preset_name, legacy[i].alias)) {
            preset_name = legacy[i].bitrate;
            if (legacy[i].mono)
                mono = 1;
            break;
        }
    }

#if HAVE_MP3LAME >= 393
    if (!strcmp(preset_name, "medium")) {
        lame_set_preset(gfp, want_fast ? MEDIUM_FAST : MEDIUM);
        return 0;
    }
#endif

    if (!strcmp(preset_name, "standard")) {
        lame_set_preset(gfp, want_fast ? STANDARD_FAST : STANDARD);
        return 0;
    }

    if (!strcmp(preset_name, "extreme")) {
        lame_set_preset(gfp, want_fast ? EXTREME_FAST : EXTREME);
        return 0;
    }

    if (!want_fast &&
        (!strcmp(preset_name, "insane") || !strcmp(preset_name, "320"))) {
        lame_set_preset(gfp, INSANE);
        return 0;
    }

    /* Generic ABR Preset */
    kbps = atoi(preset_name);
    if (kbps > 0 && !want_fast) {
        if (kbps < 8 || kbps > 320) {
            mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_LameVersion, get_lame_version(), get_lame_url());
            mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_InvalidBitrateForLamePreset);
            return -1;
        }

        lame_set_preset(gfp, kbps);

        if (cbr == 1)
            lame_set_VBR(gfp, vbr_off);

        if (mono == 1)
            lame_set_mode(gfp, MONO);

        return 0;
    }

    mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_LameVersion, get_lame_version(), get_lame_url());
    mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_InvalidLamePresetOptions);
    return -1;
}
#endif
321
#if HAVE_MP3LAME >= 392
/* lame_presets_longinfo_dm
   taken out of presets_longinfo_dm in lame-3.93.1/frontend/parse.c and modified

   Emits the long preset description through mp_msg().  The msgfp argument
   is accepted but not used. */
static void lame_presets_longinfo_dm ( FILE* msgfp )
{
    (void)msgfp;

    mp_msg(MSGT_FIXME, MSGL_FIXME, MSGTR_LamePresetsLongInfo);
}
#endif