Mercurial > mplayer.hg
view libmpdemux/demux_mov.c @ 34355:316f6edb49de
Avoid double conversion from utf16/ucs2 to utf8 for text subtitles.
There is code that auto-detects utf16 encoding of the subtitle stream
and forces the reading functions to convert it to native utf8.
The bug happens when enca (correctly) guesses that the input
file has ucs2 encoding and the input stream is then converted to utf8 again.
In my case iconv did not accept the input and discarded the subtitles
completely.
author | iive |
---|---|
date | Wed, 14 Dec 2011 00:17:49 +0000 |
parents | b6636da71bea |
children | 425467b5be98 |
line wrap: on
line source
/* * QuickTime MOV file parser * copyright(c) 2001 A'rpi * additional work by Atmos * based on TOOLS/movinfo.c by A'rpi & Al3x * compressed header support from moov.c of the openquicktime lib. * * references: http://openquicktime.sf.net/, http://www.heroinewarrior.com/ * http://www.geocities.com/SiliconValley/Lakes/2160/fformats/files/mov.pdf * (above URL no longer works, file mirrored somewhere? ::atmos) * The QuickTime File Format PDF from Apple: * http://developer.apple.com/techpubs/quicktime/qtdevdocs/PDF/QTFileFormat.pdf * (Complete list of documentation at http://developer.apple.com/quicktime/) * MP4-Lib sources from http://mpeg4ip.sf.net/ might be useful for .mp4 * as well as .mov specific stuff. * * All sort of Stuff about MPEG4: * http://www.cmlab.csie.ntu.edu.tw/~pkhsiao/thesis.html * I really recommend N4270-1.doc and N4270-2.doc which are exact specs * of the MP4-File Format and the MPEG4 Specific extensions. ::atmos * TSGS#15(02)0088 * http://www.3gpp.org/ftp/tsg_sa/TSG_SA/TSGS_15/Docs/pdf/SP-020088.pdf * http://www.3gpp2.org/Public_html/specs/C.S0050-0_v1.0_121503.pdf * * This file is part of MPlayer. * * MPlayer is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * MPlayer is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with MPlayer; if not, write to the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. 
*/

#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <inttypes.h>

#include "config.h"

#ifdef CONFIG_QUICKTIME
#include <QuickTime/QuickTime.h>
#include <QuickTime/ImageCompression.h>
#include <QuickTime/ImageCodec.h>
#else
#include "loader/qtx/qtxsdk/components.h"
#endif

#include "mp_msg.h"
#include "help_mp.h"

#include "stream/stream.h"
#include "demuxer.h"
#include "stheader.h"

#include "libmpcodecs/img_format.h"
#include "libavutil/common.h"
#include "libavutil/intreadwrite.h"

#include "sub/sub.h"

#include "demux_mov.h"
#include "qtpalette.h"
#include "parse_mp4.h" // .MP4 specific stuff

#if CONFIG_ZLIB
#include <zlib.h>
#endif

#ifndef _FCNTL_H
#include <fcntl.h>
#endif

// Read a 16-bit / 32-bit value at byte offset y of byte buffer x through
// libavutil's AV_RB16 / AV_RB32. Neither macro checks y against the buffer
// length; every caller has to do that itself.
#define char2short(x,y) AV_RB16(&(x)[(y)])
#define char2int(x,y) AV_RB32(&(x)[(y)])

// One sample (frame) of a track; pts and pos are filled by mov_build_index().
typedef struct {
    unsigned int pts; // duration
                      // (mov_build_index() stores the sum of the durmap
                      //  durations of all preceding samples here)
    unsigned int size;
    off_t pos;        // position of the sample: chunk position plus the sizes
                      // of the preceding samples in the same chunk
} mov_sample_t;

// One chunk, i.e. a run of consecutive samples stored back to back.
typedef struct {
    unsigned int sample; // number of the first sample in the chunk
    unsigned int size; // number of samples in the chunk
    int desc; // for multiple codecs mode - not used
    off_t pos;
} mov_chunk_t;

// One chunk-map entry: from chunk index 'first' up to the start of the next
// entry, every chunk holds 'spc' samples and gets description id 'sdid'
// (this is how mov_build_index() applies it).
typedef struct {
    unsigned int first;
    unsigned int spc;
    unsigned int sdid;
} mov_chunkmap_t;

// One duration-map entry: 'num' consecutive samples of duration 'dur' each.
typedef struct {
    unsigned int num;
    unsigned int dur;
} mov_durmap_t;

// One edit-list entry. dur, pos and speed are not written anywhere in this
// part of the file; the fields after the separator are computed by
// mov_build_index().
typedef struct {
    unsigned int dur; // divided by the movie timescale when converted/printed
    unsigned int pos; // compared against sample pts; a value that is negative
                      // when read as int marks an entry that is skipped
    int speed;
    //
    int frames;       // number of samples covered by this entry
    int start_sample; // index of the first sample covered by this entry
    int start_frame;  // sum of 'frames' of all preceding entries
    int pts_offset;
} mov_editlist_t;

#define MOV_TRAK_UNKNOWN 0
#define MOV_TRAK_VIDEO 1
#define MOV_TRAK_AUDIO 2
#define MOV_TRAK_FLASH 3
#define MOV_TRAK_GENERIC 4
#define MOV_TRAK_CODE 5

// Per-track state. All pointer members visible in this file are released in
// demux_close_mov().
typedef struct {
    int id;
    int type; // one of the MOV_TRAK_* values
    off_t pos;
    //
    unsigned int media_handler;
    unsigned int data_handler;
    //
    int timescale;
    unsigned int length;
    int samplesize; // 0 = variable
    int duration; // 0 = variable
    int width,height; // for video
    unsigned int fourcc;
    unsigned int nchannels;
    unsigned int samplebytes;
    //
    int tkdata_len; // track data
    unsigned char* tkdata;
    int stdata_len; // stream data
    unsigned char* stdata;
    //
    unsigned char* stream_header;
int stream_header_len; // if >0, this header should be sent before the 1st frame // int samples_size; mov_sample_t* samples; int chunks_size; mov_chunk_t* chunks; int chunkmap_size; mov_chunkmap_t* chunkmap; int durmap_size; mov_durmap_t* durmap; int keyframes_size; unsigned int* keyframes; int editlist_size; mov_editlist_t* editlist; int editlist_pos; // void* desc; // image/sound/etc description (pointer to ImageDescription etc) } mov_track_t; static void mov_build_index(mov_track_t* trak,int timescale){ int i,j,s; int last=trak->chunks_size; unsigned int pts=0; #if 0 if (trak->chunks_size <= 0) { mp_msg(MSGT_DEMUX, MSGL_WARN, "No chunk offset table, trying to build one!\n"); trak->chunks_size = trak->samples_size; /* XXX: FIXME ! */ // audit: this code will be vulnerable if it is reenabled (currently #if 0) trak->chunks = realloc(trak->chunks, sizeof(mov_chunk_t)*trak->chunks_size); for (i=0; i < trak->chunks_size; i++) trak->chunks[i].pos = -1; } #endif mp_msg(MSGT_DEMUX, MSGL_V, "MOV track #%d: %d chunks, %d samples\n",trak->id,trak->chunks_size,trak->samples_size); mp_msg(MSGT_DEMUX, MSGL_V, "pts=%d scale=%d time=%5.3f\n",trak->length,trak->timescale,(float)trak->length/(float)trak->timescale); // process chunkmap: i=trak->chunkmap_size; while(i>0){ --i; j=trak->chunkmap[i].first; for(;j>=0 && j<last;j++){ trak->chunks[j].desc=trak->chunkmap[i].sdid; trak->chunks[j].size=trak->chunkmap[i].spc; } last=FFMIN(trak->chunkmap[i].first, trak->chunks_size); } #if 0 for (i=0; i < trak->chunks_size; i++) { /* fixup position */ if (trak->chunks[i].pos == -1) if (i > 0) trak->chunks[i].pos = trak->chunks[i-1].pos + trak->chunks[i-1].size; else trak->chunks[i].pos = 0; /* FIXME: set initial pos */ #endif // calc pts of chunks: s=0; for(j=0;j<trak->chunks_size;j++){ trak->chunks[j].sample=s; s+=trak->chunks[j].size; } i = 0; for (j = 0; j < trak->durmap_size; j++) i += trak->durmap[j].num; if (i != s) { mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: durmap and chunkmap sample count 
differ (%i vs %i)\n", i, s); if (i > s) s = i; } // workaround for fixed-size video frames (dv and uncompressed) if(!trak->samples_size && trak->type!=MOV_TRAK_AUDIO){ trak->samples=calloc(s, sizeof(mov_sample_t)); trak->samples_size=trak->samples ? s : 0; for(i=0;i<trak->samples_size;i++) trak->samples[i].size=trak->samplesize; trak->samplesize=0; } if(!trak->samples_size){ // constant sampesize if(trak->durmap_size==1 || (trak->durmap_size==2 && trak->durmap[1].num==1)){ trak->duration=trak->durmap[0].dur; } else mp_msg(MSGT_DEMUX, MSGL_ERR, "*** constant samplesize & variable duration not yet supported! ***\nContact the author if you have such sample file!\n"); return; } if (trak->samples_size < s) { mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: durmap or chunkmap bigger than sample count (%i vs %i)\n", s, trak->samples_size); free(trak->samples); trak->samples = calloc(s, sizeof(mov_sample_t)); trak->samples_size = trak->samples ? s : 0; } // calc pts: s=0; for(j=0;j<trak->durmap_size;j++){ for(i=0;i<trak->durmap[j].num;i++){ if (s >= trak->samples_size) break; trak->samples[s].pts=pts; ++s; pts+=trak->durmap[j].dur; } } // calc sample offsets s=0; for(j=0;j<trak->chunks_size;j++){ off_t pos=trak->chunks[j].pos; for(i=0;i<trak->chunks[j].size;i++){ if (s >= trak->samples_size) break; trak->samples[s].pos=pos; mp_msg(MSGT_DEMUX, MSGL_DBG3, "Sample %5d: pts=%8d off=0x%08X size=%d\n",s, trak->samples[s].pts, (int)trak->samples[s].pos, trak->samples[s].size); pos+=trak->samples[s].size; ++s; } } // precalc editlist entries if(trak->editlist_size>0){ int frame=0; int e_pts=0; for(i=0;i<trak->editlist_size;i++){ mov_editlist_t* el=&trak->editlist[i]; int sample=0; int pts=el->pos; el->start_frame=frame; if(pts<0){ // skip! 
el->frames=0; continue; } // find start sample for(;sample<trak->samples_size;sample++){ if(pts<=trak->samples[sample].pts) break; } el->start_sample=sample; el->pts_offset=((long long)e_pts*(long long)trak->timescale)/(long long)timescale-trak->samples[sample].pts; pts+=((long long)el->dur*(long long)trak->timescale)/(long long)timescale; e_pts+=el->dur; // find end sample for(;sample<trak->samples_size;sample++){ if(pts<trak->samples[sample].pts) break; } el->frames=sample-el->start_sample; frame+=el->frames; mp_msg(MSGT_DEMUX,MSGL_V,"EL#%d: pts=%d 1st_sample=%d frames=%d (%5.3fs) pts_offs=%d\n",i, el->pos,el->start_sample, el->frames, (float)(el->dur)/(float)timescale, el->pts_offset); } } } #define MOV_MAX_TRACKS 256 #define MOV_MAX_SUBLEN 1024 typedef struct { off_t moov_start; off_t moov_end; off_t mdat_start; off_t mdat_end; int track_db; mov_track_t* tracks[MOV_MAX_TRACKS]; int timescale; // movie timescale int duration; // movie duration (in movie timescale units) subtitle subs; char subtext[MOV_MAX_SUBLEN + 1]; int current_sub; } mov_priv_t; #define MOV_FOURCC(a,b,c,d) ((a<<24)|(b<<16)|(c<<8)|(d)) static int mov_check_file(demuxer_t* demuxer){ int flags=0; int no=0; mov_priv_t* priv=calloc(1, sizeof(mov_priv_t)); mp_msg(MSGT_DEMUX,MSGL_V,"Checking for MOV\n"); priv->current_sub = -1; while(1){ int i; int skipped=8; off_t len=stream_read_dword(demuxer->stream); unsigned int id=stream_read_dword(demuxer->stream); if(stream_eof(demuxer->stream)) break; // EOF if (len == 1) /* real size is 64bits - cjb */ { #ifndef _LARGEFILE_SOURCE if (stream_read_dword(demuxer->stream) != 0) mp_msg(MSGT_DEMUX, MSGL_WARN, "64bit file, but you've compiled MPlayer without LARGEFILE support!\n"); len = stream_read_dword(demuxer->stream); #else len = stream_read_qword(demuxer->stream); #endif skipped += 8; } #if 0 else if (len == 0) /* deleted chunk */ { /* XXX: CJB! is this right? 
- alex */
            goto skip_chunk;
        }
#endif
        // Interior of mov_check_file()'s atom loop: 'len' is the size of the
        // current top-level atom, 'id' its type and 'skipped' the number of
        // bytes of it consumed so far. After the switch the remaining
        // len-skipped bytes are skipped, so every case must keep 'skipped'
        // in step with what it reads.
        if(len<8) break; // invalid chunk

        switch(id){
        case MOV_FOURCC('f','t','y','p'): {
          unsigned int tmp;
          // File Type Box (ftyp):
          // char[4] major_brand (eg. 'isom')
          // int minor_version (eg. 0x00000000)
          // char[4] compatible_brands[] (eg. 'mp41')
          // compatible_brands list spans to the end of box
#if 1
          tmp = stream_read_dword(demuxer->stream);
          switch(tmp) {
            case MOV_FOURCC('i','s','o','m'):
              mp_msg(MSGT_DEMUX,MSGL_V,"ISO: File Type Major Brand: ISO Base Media\n");
              break;
            case MOV_FOURCC('m','p','4','1'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: ISO/IEC 14496-1 (MPEG-4 system) v1\n");
              break;
            case MOV_FOURCC('m','p','4','2'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: ISO/IEC 14496-1 (MPEG-4 system) v2\n");
              break;
            case MOV_FOURCC('M','4','A',' '):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: Apple iTunes AAC-LC Audio\n");
              break;
            case MOV_FOURCC('M','4','P',' '):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: Apple iTunes AAC-LC Protected Audio\n");
              break;
            case MOV_FOURCC('q','t',' ',' '):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: Original QuickTime\n");
              break;
            case MOV_FOURCC('3','g','p','1'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: 3GPP Profile 1\n");
              break;
            case MOV_FOURCC('3','g','p','2'):
            case MOV_FOURCC('3','g','2','a'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: 3GPP Profile 2\n");
              break;
            case MOV_FOURCC('3','g','p','3'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: 3GPP Profile 3\n");
              break;
            case MOV_FOURCC('3','g','p','4'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: 3GPP Profile 4\n");
              break;
            case MOV_FOURCC('3','g','p','5'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: 3GPP Profile 5\n");
              break;
            case MOV_FOURCC('m','m','p','4'):
              mp_msg(MSGT_DEMUX,MSGL_INFO,"ISO: File Type Major Brand: Mobile ISO/IEC 14496-1 (MPEG-4 system)\n");
              break;
            default:
              // convert back to file byte order so the four characters can be
              // printed with %.4s
              tmp = be2me_32(tmp);
              mp_msg(MSGT_DEMUX,MSGL_WARN,"ISO: Unknown File Type Major Brand: %.4s\n",(char *)&tmp);
          }
          mp_msg(MSGT_DEMUX,MSGL_V,"ISO: File Type Minor Version: %d\n",
              stream_read_dword(demuxer->stream));
          skipped += 8;
          // List all compatible brands
          for(i = 0; i < ((len-16)/4); i++) {
            tmp = be2me_32(stream_read_dword(demuxer->stream));
            mp_msg(MSGT_DEMUX,MSGL_V,"ISO: File Type Compatible Brand #%d: %.4s\n",i,(char *)&tmp);
            skipped += 4;
          }
#endif
          } break;
        case MOV_FOURCC('m','o','o','v'):
//      case MOV_FOURCC('c','m','o','v'):
          mp_msg(MSGT_DEMUX,MSGL_V,"MOV: Movie header found!\n");
          priv->moov_start=(off_t)stream_tell(demuxer->stream);
          priv->moov_end=(off_t)priv->moov_start+len-skipped;
          mp_msg(MSGT_DEMUX,MSGL_DBG2,"MOV: Movie header: start: %"PRIx64" end: %"PRIx64"\n",
            (int64_t)priv->moov_start, (int64_t)priv->moov_end);
          // peek at the first child atom: size into i (minus its 8-byte
          // header), then its type
          skipped+=8;
          i = stream_read_dword(demuxer->stream)-8;
          if(stream_read_dword(demuxer->stream)==MOV_FOURCC('r','m','r','a')){
              skipped+=i;
              mp_msg(MSGT_DEMUX,MSGL_INFO,"MOV: Reference Media file!!!\n");
              //set demuxer type to playlist ...
              demuxer->type=DEMUXER_TYPE_PLAYLIST;
              // i counts the bytes still unread inside the rmra atom
              while(i>0){
                  // NOTE: this 'len' shadows the outer atom length
                  int len=stream_read_dword(demuxer->stream)-8;
                  int fcc=stream_read_dword(demuxer->stream);
                  if(len<0) break; // EOF!?
                  i-=8;
//                printf("i=%d len=%d\n",i,len);
                  switch(fcc){
                  case MOV_FOURCC('r','m','d','a'):
                      // container atom: descend by simply reading its children
                      continue;
                  case MOV_FOURCC('r','d','r','f'): {
                      av_unused int tmp=stream_read_dword(demuxer->stream);
                      av_unused int type=stream_read_dword_le(demuxer->stream);
                      int slen=stream_read_dword(demuxer->stream);
                      //char* s=malloc(slen+1);
                      //stream_read(demuxer->stream,s,slen);

                      //FIXME: also store type & data_rate ?
                      ds_read_packet(demuxer->video,
                        demuxer->stream,
                        slen,
                        0,
                        stream_tell(demuxer->stream),
                        0 // no flags
                      );
                      flags|=4;
                      mp_msg(MSGT_DEMUX,MSGL_V,"Added reference to playlist\n");
                      //s[slen]=0;
                      //mp_msg(MSGT_DEMUX,MSGL_INFO,"REF: [%.4s] %s\n",&type,s);
                      len-=12+slen;i-=12+slen; break;
                    }
                  case MOV_FOURCC('r','m','d','r'): {
                      // NOTE: this 'flags' shadows the function-level flags
                      // and is only read to advance the stream
                      av_unused int flags=stream_read_dword(demuxer->stream);
                      int rate=stream_read_dword(demuxer->stream);
                      mp_msg(MSGT_DEMUX,MSGL_V," min. data rate: %d bits/sec\n",rate);
                      len-=8; i-=8; break;
                    }
                  case MOV_FOURCC('r','m','q','u'): {
                      int q=stream_read_dword(demuxer->stream);
                      mp_msg(MSGT_DEMUX,MSGL_V," quality index: %d\n",q);
                      len-=4; i-=4; break;
                    }
                  }
                  // skip whatever is left of this child atom
                  i-=len;stream_skip(demuxer->stream,len);
              }
          }
          flags|=1;
          break;
        case MOV_FOURCC('w','i','d','e'):
          mp_msg(MSGT_DEMUX,MSGL_V,"MOV: 'WIDE' chunk found!\n");
          if(flags&2) break;
          /* fallthrough: a 'wide' atom seen before any data is handled like mdat */
        case MOV_FOURCC('m','d','a','t'):
          mp_msg(MSGT_DEMUX,MSGL_V,"MOV: Movie DATA found!\n");
          priv->mdat_start=stream_tell(demuxer->stream);
          priv->mdat_end=priv->mdat_start+len-skipped;
          mp_msg(MSGT_DEMUX,MSGL_DBG2,"MOV: Movie data: start: %"PRIx64" end: %"PRIx64"\n",
            (int64_t)priv->mdat_start, (int64_t)priv->mdat_end);
          flags|=2;
          if(flags==3){
            // if we're over the headers, then we can stop parsing here!
            demuxer->priv=priv;
            return DEMUXER_TYPE_MOV;
          }
          break;
        case MOV_FOURCC('f','r','e','e'):
        case MOV_FOURCC('s','k','i','p'):
        case MOV_FOURCC('j','u','n','k'):
          mp_msg(MSGT_DEMUX,MSGL_DBG2,"MOV: free space (len: %"PRId64")\n", (int64_t)len);
          /* unused, if you edit a mov, you can use space provided by free atoms (redefining it) */
          break;
        case MOV_FOURCC('p','n','o','t'):
        case MOV_FOURCC('P','I','C','T'):
          /* dunno what, but we should ignore it */
          break;
        default:
          if(no==0){ free(priv); return 0;} // first chunk is bad!
id = be2me_32(id); mp_msg(MSGT_DEMUX,MSGL_V,"MOV: unknown chunk: %.4s %d\n",(char *)&id,(int)len); } //skip_chunk: if(!stream_skip(demuxer->stream,len-skipped)) break; ++no; } if(flags==3){ demuxer->priv=priv; return DEMUXER_TYPE_MOV; } free(priv); if ((flags==5) || (flags==7)) // reference & header sent return DEMUXER_TYPE_PLAYLIST; if(flags==1) mp_msg(MSGT_DEMUX,MSGL_WARN,"MOV: missing data (mdat) chunk! Maybe broken file...\n"); else if(flags==2) mp_msg(MSGT_DEMUX,MSGL_WARN,"MOV: missing header (moov/cmov) chunk! Maybe broken file...\n"); return 0; } static void demux_close_mov(demuxer_t *demuxer) { mov_priv_t* priv = demuxer->priv; int i; if (!priv) return; for (i = 0; i < MOV_MAX_TRACKS; i++) { mov_track_t *track = priv->tracks[i]; if (track) { free(track->tkdata); free(track->stdata); free(track->stream_header); free(track->samples); free(track->chunks); free(track->chunkmap); free(track->durmap); free(track->keyframes); free(track->editlist); free(track->desc); free(track); } } free(priv); } unsigned int store_ughvlc(unsigned char *s, unsigned int v){ unsigned int n = 0; while(v >= 0xff) { *s++ = 0xff; v -= 0xff; n++; } *s = v; n++; return n; } static void init_vobsub(sh_sub_t *sh, mov_track_t *trak) { sh->type = 'v'; if (trak->stdata_len < 106) return; sh->extradata_len = 16*4; sh->extradata = malloc(sh->extradata_len); memcpy(sh->extradata, trak->stdata + 42, sh->extradata_len); } static int lschunks_intrak(demuxer_t* demuxer, int level, unsigned int id, off_t pos, off_t len, mov_track_t* trak); static int gen_sh_audio(sh_audio_t* sh, mov_track_t* trak, int timescale) { #if 0 struct { int16_t version; // 0 or 1 (version 1 is qt3.0+) int16_t revision; // 0 int32_t vendor_id; // 0 int16_t channels; // 1 or 2 (Mono/Stereo) int16_t samplesize; // 8 or 16 (8Bit/16Bit) int16_t compression_id; // if version 0 then 0 // if version 1 and vbr then -2 else 0 int16_t packet_size; // 0 uint16_t sample_rate; // samplerate (Hz) // qt3.0+ (version == 1) uint32_t 
samples_per_packet; // 0 or num uncompressed samples in a packet // if 0 below three values are also 0 uint32_t bytes_per_packet; // 0 or num compressed bytes for one channel uint32_t bytes_per_frame; // 0 or num compressed bytes for all channels // (channels * bytes_per_packet) uint32_t bytes_per_sample; // 0 or size of uncompressed sample // if samples_per_packet and bytes_per_packet are constant (CBR) // then bytes_per_frame and bytes_per_sample must be 0 (else is VBR) // --- // optional additional atom-based fields // ([int32_t size,int32_t type,some data ],repeat) } my_stdata; #endif int version, adjust; int is_vorbis = 0; sh->format=trak->fourcc; // crude audio delay from editlist0 hack ::atm if(trak->editlist_size>=1) { if(trak->editlist[0].pos == -1) { sh->stream_delay = (float)trak->editlist[0].dur/(float)timescale; mp_msg(MSGT_DEMUX,MSGL_V,"MOV: Initial Audio-Delay: %.3f sec\n", sh->stream_delay); } } switch( sh->format ) { case 0x726D6173: /* samr */ /* amr narrowband */ trak->samplebytes=sh->samplesize=1; trak->nchannels=sh->channels=1; sh->samplerate=8000; break; case 0x62776173: /* sawb */ /* amr wideband */ trak->samplebytes=sh->samplesize=1; trak->nchannels=sh->channels=1; sh->samplerate=16000; break; default: // assumptions for below table: short is 16bit, int is 32bit, intfp is 16bit // XXX: 32bit fixed point numbers (intfp) are only 2 Byte! // short values are usually one byte leftpadded by zero // int values are usually two byte leftpadded by zero // stdata[]: // 8 short version // 10 short revision // 12 int vendor_id // 16 short channels // 18 short samplesize // 20 short compression_id // 22 short packet_size (==0) // 24 intfp sample_rate // (26 short) unknown (==0) // ---- qt3.0+ (version>=1) // 28 int samples_per_packet // 32 int bytes_per_packet // 36 int bytes_per_frame // 40 int bytes_per_sample // there may be additional atoms following at 28 (version 0) // or 44 (version 1), eg. 
esds atom of .MP4 files // esds atom: // 28 int atom size (bytes of int size, int type and data) // 32 char[4] atom type (fourc charater code -> esds) // 36 char[] atom data (len=size-8) // TODO: fix parsing for files using version 2. if (trak->stdata_len < 26) { mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: broken (too small) sound atom!\n"); return 0; } version=char2short(trak->stdata,8); if (version > 1) mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: version %d sound atom may not parse correctly!\n", version); trak->samplebytes=sh->samplesize=char2short(trak->stdata,18)/8; /* I can't find documentation, but so far this is the case. -Corey */ switch (char2short(trak->stdata,16)) { case 1: trak->nchannels = 1; break; case 2: trak->nchannels = 2; break; case 3: trak->nchannels = 6; break; default: mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: unable to determine audio channels, assuming 2 (got %d)\n", char2short(trak->stdata,16)); trak->nchannels = 2; } sh->channels = trak->nchannels; /*printf("MOV: timescale: %d samplerate: %d durmap: %d (%d) -> %d (%d)\n", trak->timescale, char2short(trak->stdata,24), trak->durmap[0].dur, trak->durmap[0].num, trak->timescale/trak->durmap[0].dur, char2short(trak->stdata,24)/trak->durmap[0].dur);*/ sh->samplerate=char2short(trak->stdata,24); if((sh->samplerate < 7000) && trak->durmap && trak->durmap[0].dur > 1) { switch(char2short(trak->stdata,24)/trak->durmap[0].dur) { // TODO: add more cases. 
case 31: sh->samplerate = 32000; break; case 43: sh->samplerate = 44100; break; case 47: sh->samplerate = 48000; break; default: mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: unable to determine audio samplerate, " "assuming 44.1kHz (got %d)\n", char2short(trak->stdata,24)/trak->durmap[0].dur); sh->samplerate = 44100; } } } mp_msg(MSGT_DEMUX, MSGL_V, "Audio bits: %d chans: %d rate: %d\n", sh->samplesize*8,sh->channels,sh->samplerate); if(trak->stdata_len >= 44 && trak->stdata[9]>=1){ mp_msg(MSGT_DEMUX,MSGL_V,"Audio header: samp/pack=%d bytes/pack=%d bytes/frame=%d bytes/samp=%d \n", char2int(trak->stdata,28), char2int(trak->stdata,32), char2int(trak->stdata,36), char2int(trak->stdata,40)); if(trak->stdata_len>=44+8){ int len=char2int(trak->stdata,44); int fcc=char2int(trak->stdata,48); // we have extra audio headers!!! mp_msg(MSGT_DEMUX,MSGL_V,"Audio extra header: len=%d fcc=0x%X\n",len,fcc); if((len >= 4) && (char2int(trak->stdata,52) >= 12) && (char2int(trak->stdata,52+4) == MOV_FOURCC('f','r','m','a'))) { switch(char2int(trak->stdata,52+8)) { case MOV_FOURCC('a','l','a','c'): if (len >= 36 + char2int(trak->stdata,52)) { sh->codecdata_len = char2int(trak->stdata,52+char2int(trak->stdata,52)); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found alac atom (%d)!\n", sh->codecdata_len); sh->codecdata = malloc(sh->codecdata_len); memcpy(sh->codecdata, &trak->stdata[52+char2int(trak->stdata,52)], sh->codecdata_len); } break; case MOV_FOURCC('i','n','2','4'): case MOV_FOURCC('i','n','3','2'): case MOV_FOURCC('f','l','3','2'): case MOV_FOURCC('f','l','6','4'): if ((len >= 22) && (char2int(trak->stdata,52+16)==MOV_FOURCC('e','n','d','a')) && (char2short(trak->stdata,52+20))) { sh->format=char2int(trak->stdata,52+8); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found little endian PCM data, reversed fourcc:%04x\n", sh->format); } break; default: if (len > 8 && len + 44 <= trak->stdata_len) { sh->codecdata_len = len-8; sh->codecdata = malloc(sh->codecdata_len); memcpy(sh->codecdata, trak->stdata+44+8, 
sh->codecdata_len); } } } else { if (len > 8 && len + 44 <= trak->stdata_len) { sh->codecdata_len = len-8; sh->codecdata = malloc(sh->codecdata_len); memcpy(sh->codecdata, trak->stdata+44+8, sh->codecdata_len); } } } } switch (version) { case 0: adjust = 0; break; case 1: adjust = 48; break; case 2: adjust = 68; break; default: mp_msg(MSGT_DEMUX, MSGL_WARN, "MOV: unknown sound atom version (%d); may not work!\n", version); adjust = 68; } if (trak->stdata_len >= 36 + adjust) { int atom_len = char2int(trak->stdata,28+adjust); if (atom_len < 0 || atom_len > trak->stdata_len - 28 - adjust) atom_len = trak->stdata_len - 28 - adjust; switch(char2int(trak->stdata,32+adjust)) { // atom type case MOV_FOURCC('e','s','d','s'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found MPEG4 audio Elementary Stream Descriptor atom (%d)!\n", atom_len); if(atom_len > 8) { esds_t esds; if(!mp4_parse_esds(&trak->stdata[36+adjust], atom_len-8, &esds)) { /* 0xdd is a "user private" id, not an official allocated id (see http://www.mp4ra.org/object.html), so perform some extra checks to be sure that this is really vorbis audio */ if(esds.objectTypeId==0xdd && esds.streamType==0x15 && sh->format==0x6134706D && esds.decoderConfigLen > 8) { //vorbis audio unsigned char *buf[3]; unsigned short sizes[3]; int offset, len, k; unsigned char *ptr = esds.decoderConfig; if(ptr[0] != 0 || ptr[1] != 30) goto quit_vorbis_block; //wrong extradata layout offset = len = 0; for(k = 0; k < 3; k++) { sizes[k] = (ptr[offset]<<8) | ptr[offset+1]; len += sizes[k]; offset += 2; if(offset + sizes[k] > esds.decoderConfigLen) { mp_msg(MSGT_DEMUX, MSGL_FATAL, "MOV: ERROR!, not enough vorbis extradata to read: offset = %d, k=%d, size=%d, len: %d\n", offset, k, sizes[k], esds.decoderConfigLen); goto quit_vorbis_block; } buf[k] = malloc(sizes[k]); if(!buf[k]) goto quit_vorbis_block; memcpy(buf[k], &ptr[offset], sizes[k]); offset += sizes[k]; } sh->codecdata_len = len + len/255 + 64; sh->codecdata = malloc(sh->codecdata_len); ptr = 
sh->codecdata; ptr[0] = 2; offset = 1; offset += store_ughvlc(&ptr[offset], sizes[0]); offset += store_ughvlc(&ptr[offset], sizes[1]); for(k = 0; k < 3; k++) { memcpy(&ptr[offset], buf[k], sizes[k]); offset += sizes[k]; } sh->codecdata_len = offset; sh->codecdata = realloc(sh->codecdata, offset); mp_msg(MSGT_DEMUX,MSGL_V, "demux_mov, vorbis extradata size: %d\n", offset); is_vorbis = 1; quit_vorbis_block: sh->format = mmioFOURCC('v', 'r', 'b', 's'); } sh->i_bps = esds.avgBitrate/8; // printf("######## audio format = %d ########\n",esds.objectTypeId); if(esds.objectTypeId==MP4OTI_MPEG1Audio || esds.objectTypeId==MP4OTI_MPEG2AudioPart3) sh->format=0x55; // .mp3 if(esds.objectTypeId==MP4OTI_13kVoice) { // 13K Voice, defined by 3GPP2 sh->format=mmioFOURCC('Q', 'c', 'l', 'p'); trak->nchannels=sh->channels=1; trak->samplebytes=sh->samplesize=1; } // dump away the codec specific configuration for the AAC decoder if(esds.decoderConfigLen){ if( (esds.decoderConfig[0]>>3) == 29 ) sh->format = 0x1d61346d; // request multi-channel mp3 decoder if(!is_vorbis) { sh->codecdata_len = esds.decoderConfigLen; sh->codecdata = malloc(sh->codecdata_len); memcpy(sh->codecdata, esds.decoderConfig, sh->codecdata_len); } } } mp4_free_esds(&esds); // freeup esds mem #if 0 { FILE* f=fopen("esds.dat","wb"); fwrite(&trak->stdata[36],atom_len-8,1,f); fclose(f); } #endif } } break; case MOV_FOURCC('a','l','a','c'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found alac atom (%d)!\n", atom_len); if(atom_len > 8) { // copy all the atom (not only payload) for lavc alac decoder sh->codecdata_len = atom_len; sh->codecdata = malloc(sh->codecdata_len); memcpy(sh->codecdata, &trak->stdata[28], sh->codecdata_len); } } break; case MOV_FOURCC('d','a','m','r'): mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found AMR audio atom %c%c%c%c (%d)!\n", trak->stdata[32+adjust],trak->stdata[33+adjust],trak->stdata[34+adjust],trak->stdata[35+adjust], atom_len); if (atom_len>14) { mp_msg(MSGT_DEMUX, MSGL_V, "mov: vendor: %c%c%c%c Version: 
%d\n",trak->stdata[36+adjust],trak->stdata[37+adjust],trak->stdata[38+adjust], trak->stdata[39+adjust],trak->stdata[40+adjust]); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Modes set: %02x%02x\n",trak->stdata[41+adjust],trak->stdata[42+adjust]); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Mode change period: %d Frames per sample: %d\n",trak->stdata[43+adjust],trak->stdata[44+adjust]); } break; default: mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unknown audio atom %c%c%c%c (%d)!\n", trak->stdata[32+adjust],trak->stdata[33+adjust],trak->stdata[34+adjust],trak->stdata[35+adjust], atom_len); } } mp_msg(MSGT_DEMUX, MSGL_V, "Fourcc: %.4s\n",(char *)&trak->fourcc); #if 0 { FILE* f=fopen("stdata.dat","wb"); fwrite(trak->stdata,trak->stdata_len,1,f); fclose(f); } { FILE* f=fopen("tkdata.dat","wb"); fwrite(trak->tkdata,trak->tkdata_len,1,f); fclose(f); } #endif // Emulate WAVEFORMATEX struct: sh->wf=calloc(1, sizeof(*sh->wf) + (is_vorbis ? sh->codecdata_len : 0)); sh->wf->nChannels=sh->channels; sh->wf->wBitsPerSample=(trak->stdata[18]<<8)+trak->stdata[19]; // sh->wf->nSamplesPerSec=trak->timescale; sh->wf->nSamplesPerSec=sh->samplerate; if(trak->stdata_len >= 44 && trak->stdata[9]>=1 && char2int(trak->stdata,28)>0){ //Audio header: samp/pack=4096 bytes/pack=743 bytes/frame=1486 bytes/samp=2 sh->wf->nAvgBytesPerSec=(sh->wf->nChannels*sh->wf->nSamplesPerSec* char2int(trak->stdata,32)+char2int(trak->stdata,28)/2) /char2int(trak->stdata,28); sh->wf->nBlockAlign=char2int(trak->stdata,36); } else { sh->wf->nAvgBytesPerSec=sh->wf->nChannels*sh->wf->wBitsPerSample*sh->wf->nSamplesPerSec/8; // workaround for ms11 ima4 if (sh->format == 0x1100736d && trak->stdata_len >= 36) sh->wf->nBlockAlign=char2int(trak->stdata,36); } if(is_vorbis && sh->codecdata_len) { memcpy(sh->wf+1, sh->codecdata, sh->codecdata_len); sh->wf->cbSize = sh->codecdata_len; } // Selection: // if(demuxer->audio->id==-1 || demuxer->audio->id==priv->track_db){ // // (auto)selected audio track: // demuxer->audio->id=priv->track_db; // 
demuxer->audio->sh=sh; sh->ds=demuxer->audio; // } return 1; } static int gen_sh_video(sh_video_t* sh, mov_track_t* trak, int timescale) { int depth, i, entry; int flag, start, count_flag, end, palette_count, gray; int hdr_ptr = 76; // the byte just after depth unsigned char *palette_map; sh->format=trak->fourcc; // crude video delay from editlist0 hack ::atm if(trak->editlist_size>=1) { if(trak->editlist[0].pos == -1) { sh->stream_delay = (float)trak->editlist[0].dur/(float)timescale; mp_msg(MSGT_DEMUX,MSGL_V,"MOV: Initial Video-Delay: %.3f sec\n", sh->stream_delay); } } if (trak->stdata_len < 78) { mp_msg(MSGT_DEMUXER, MSGL_WARN, "MOV: Invalid (%d bytes instead of >= 78) video trak desc\n", trak->stdata_len); return 0; } depth = trak->stdata[75] | (trak->stdata[74] << 8); if (trak->fourcc == mmioFOURCC('r', 'a', 'w', ' ')) sh->format = IMGFMT_RGB | depth; // stdata[]: // 8 short version // 10 short revision // 12 int vendor_id // 16 int temporal_quality // 20 int spatial_quality // 24 short width // 26 short height // 28 int h_dpi // 32 int v_dpi // 36 int 0 // 40 short frames_per_sample // 42 char[4] compressor_name // 74 short depth // 76 short color_table_id // additional atoms may follow, // eg esds atom from .MP4 files // 78 int atom size // 82 char[4] atom type // 86 ... 
atom data { ImageDescription* id=malloc(8+trak->stdata_len); // safe trak->desc=id; id->idSize=8+trak->stdata_len; // id->cType=bswap_32(trak->fourcc); id->cType=le2me_32(trak->fourcc); id->version=char2short(trak->stdata,8); id->revisionLevel=char2short(trak->stdata,10); id->vendor=char2int(trak->stdata,12); id->temporalQuality=char2int(trak->stdata,16); id->spatialQuality=char2int(trak->stdata,20); id->width=char2short(trak->stdata,24); id->height=char2short(trak->stdata,26); id->hRes=char2int(trak->stdata,28); id->vRes=char2int(trak->stdata,32); id->dataSize=char2int(trak->stdata,36); id->frameCount=char2short(trak->stdata,40); memcpy(&id->name,trak->stdata+42,32); id->depth=char2short(trak->stdata,74); id->clutID=char2short(trak->stdata,76); if(trak->stdata_len>78) memcpy(((char*)&id->clutID)+2,trak->stdata+78,trak->stdata_len-78); sh->ImageDesc=id; #if 0 { FILE *f=fopen("ImageDescription","wb"); fwrite(id,id->idSize,1,f); fclose(f); } #endif } if(trak->stdata_len >= 86) { // extra atoms found int pos=78; int atom_len; while(pos+8<=trak->stdata_len && (pos+(atom_len=char2int(trak->stdata,pos)))<=trak->stdata_len){ switch(char2int(trak->stdata,pos+4)) { // switch atom type case MOV_FOURCC('g','a','m','a'): // intfp with gamma value at which movie was captured // can be used to gamma correct movie display mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unsupported Gamma-Correction movie atom (%d)!\n", atom_len); break; case MOV_FOURCC('f','i','e','l'): // 2 char-values (8bit int) that specify field handling // see the Apple's QuickTime Fileformat PDF for more info mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unsupported Field-Handling movie atom (%d)!\n", atom_len); break; case MOV_FOURCC('m','j','q','t'): // Motion-JPEG default quantization table mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unsupported MJPEG-Quantization movie atom (%d)!\n", atom_len); break; case MOV_FOURCC('m','j','h','t'): // Motion-JPEG default huffman table mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unsupported 
MJPEG-Huffman movie atom (%d)!\n", atom_len); break; case MOV_FOURCC('e','s','d','s'): // MPEG4 Elementary Stream Descriptor header mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found MPEG4 movie Elementary Stream Descriptor atom (%d)!\n", atom_len); // add code here to save esds header of length atom_len-8 // beginning at stdata[86] to some variable to pass it // on to the decoder ::atmos if(atom_len > 8) { esds_t esds; if(!mp4_parse_esds(trak->stdata+pos+8, atom_len-8, &esds)) { if(esds.objectTypeId==MP4OTI_MPEG2VisualSimple || esds.objectTypeId==MP4OTI_MPEG2VisualMain || esds.objectTypeId==MP4OTI_MPEG2VisualSNR || esds.objectTypeId==MP4OTI_MPEG2VisualSpatial || esds.objectTypeId==MP4OTI_MPEG2VisualHigh || esds.objectTypeId==MP4OTI_MPEG2Visual422) sh->format=mmioFOURCC('m', 'p', 'g', '2'); else if(esds.objectTypeId==MP4OTI_MPEG1Visual) sh->format=mmioFOURCC('m', 'p', 'g', '1'); // dump away the codec specific configuration for the AAC decoder trak->stream_header_len = esds.decoderConfigLen; trak->stream_header = malloc(trak->stream_header_len); memcpy(trak->stream_header, esds.decoderConfig, trak->stream_header_len); } mp4_free_esds(&esds); // freeup esds mem } break; case MOV_FOURCC('a','v','c','C'): // AVC decoder configuration record mp_msg(MSGT_DEMUX, MSGL_V, "MOV: AVC decoder configuration record atom (%d)!\n", atom_len); if(atom_len > 8) { int i, poffs, cnt; // Parse some parts of avcC, just for fun :) // real parsing is done by avc1 decoder mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC version: %d\n", *(trak->stdata+pos+8)); if (*(trak->stdata+pos+8) != 1) mp_msg(MSGT_DEMUX, MSGL_ERR, "MOV: unknown avcC version (%d). 
Expexct problems.\n", *(trak->stdata+pos+9)); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC profile: %d\n", *(trak->stdata+pos+9)); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC profile compatibility: %d\n", *(trak->stdata+pos+10)); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC level: %d\n", *(trak->stdata+pos+11)); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC nal length size: %d\n", ((*(trak->stdata+pos+12))&0x03)+1); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC number of sequence param sets: %d\n", cnt = (*(trak->stdata+pos+13) & 0x1f)); poffs = pos + 14; for (i = 0; i < cnt; i++) { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC sps %d have length %d\n", i, AV_RB16(trak->stdata+poffs)); poffs += AV_RB16(trak->stdata+poffs) + 2; } mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC number of picture param sets: %d\n", *(trak->stdata+poffs)); poffs++; for (i = 0; i < cnt; i++) { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: avcC pps %d have length %d\n", i, AV_RB16(trak->stdata+poffs)); poffs += AV_RB16(trak->stdata+poffs) + 2; } // Copy avcC for the AVC decoder // This data will be put in extradata below, where BITMAPINFOHEADER is created trak->stream_header_len = atom_len-8; trak->stream_header = malloc(trak->stream_header_len); memcpy(trak->stream_header, trak->stdata+pos+8, trak->stream_header_len); } break; case MOV_FOURCC('d','2','6','3'): mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found H.263 decoder atom %c%c%c%c (%d)!\n", trak->stdata[pos+4],trak->stdata[pos+5],trak->stdata[pos+6],trak->stdata[pos+7],atom_len); if (atom_len>10) mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Vendor: %c%c%c%c H.263 level: %d H.263 profile: %d \n", trak->stdata[pos+8],trak->stdata[pos+9],trak->stdata[pos+10],trak->stdata[pos+11],trak->stdata[pos+12],trak->stdata[pos+13]); break; case 0: break; default: mp_msg(MSGT_DEMUX, MSGL_V, "MOV: Found unknown movie atom %c%c%c%c (%d)!\n", trak->stdata[pos+4],trak->stdata[pos+5],trak->stdata[pos+6],trak->stdata[pos+7], atom_len); } if(atom_len<8) break; pos+=atom_len; // printf("pos=%d max=%d\n",pos,trak->stdata_len); } } 
sh->fps=trak->timescale/ ((trak->durmap_size>=1)?(float)trak->durmap[0].dur:1); sh->frametime=1.0f/sh->fps; sh->disp_w=trak->stdata[25]|(trak->stdata[24]<<8); sh->disp_h=trak->stdata[27]|(trak->stdata[26]<<8); if(trak->tkdata_len>81) { // if image size is zero, fallback to display size if(!sh->disp_w && !sh->disp_h) { sh->disp_w=trak->tkdata[77]|(trak->tkdata[76]<<8); sh->disp_h=trak->tkdata[81]|(trak->tkdata[80]<<8); } else if(sh->disp_w!=(trak->tkdata[77]|(trak->tkdata[76]<<8))){ // codec and display width differ... use display one for aspect sh->aspect=trak->tkdata[77]|(trak->tkdata[76]<<8); sh->aspect/=trak->tkdata[81]|(trak->tkdata[80]<<8); } } if(depth>32+8) mp_msg(MSGT_DEMUX, MSGL_INFO,"*** depth = 0x%X\n",depth); // palettized? gray = 0; if (depth > 32) { depth&=31; gray = 1; } // depth > 32 means grayscale if ((depth == 2) || (depth == 4) || (depth == 8)) palette_count = (1 << depth); else palette_count = 0; // emulate BITMAPINFOHEADER: if (palette_count) { sh->bih=calloc(1, sizeof(*sh->bih) + palette_count * 4); sh->bih->biSize=40 + palette_count * 4; // fetch the relevant fields flag = AV_RB16(&trak->stdata[hdr_ptr]); hdr_ptr += 2; start = AV_RB32(&trak->stdata[hdr_ptr]); hdr_ptr += 4; count_flag = AV_RB16(&trak->stdata[hdr_ptr]); hdr_ptr += 2; end = AV_RB16(&trak->stdata[hdr_ptr]); hdr_ptr += 2; palette_map = (unsigned char *)sh->bih + 40; mp_msg(MSGT_DEMUX, MSGL_V, "Allocated %d entries for palette\n", palette_count); mp_msg(MSGT_DEMUX, MSGL_DBG2, "QT palette: start: %x, end: %x, count flag: %d, flags: %x\n", start, end, count_flag, flag); /* XXX: problems with sample (statunit6.mov) with flag&0x4 set! 
- alex*/ // load default palette if (flag & 0x08) { if (gray) { mp_msg(MSGT_DEMUX, MSGL_V, "Using default QT grayscale palette\n"); if (palette_count == 16) memcpy(palette_map, qt_default_grayscale_palette_16, 16 * 4); else if (palette_count == 256) { memcpy(palette_map, qt_default_grayscale_palette_256, 256 * 4); if (trak->fourcc == mmioFOURCC('c','v','i','d')) { int i; // Hack for grayscale CVID, negative palette // If you have samples where this is not required contact me (rxt) mp_msg(MSGT_DEMUX, MSGL_V, "MOV: greyscale cvid with default palette," " enabling negative palette hack.\n"); for (i = 0; i < 256 * 4; i++) palette_map[i] = palette_map[i] ^ 0xff; } } } else { mp_msg(MSGT_DEMUX, MSGL_V, "Using default QT colour palette\n"); if (palette_count == 4) memcpy(palette_map, qt_default_palette_4, 4 * 4); else if (palette_count == 16) memcpy(palette_map, qt_default_palette_16, 16 * 4); else if (palette_count == 256) memcpy(palette_map, qt_default_palette_256, 256 * 4); } } // load palette from file else { mp_msg(MSGT_DEMUX, MSGL_V, "Loading palette from file\n"); for (i = start; i <= end; i++) { entry = AV_RB16(&trak->stdata[hdr_ptr]); hdr_ptr += 2; // apparently, if count_flag is set, entry is same as i if (count_flag & 0x8000) entry = i; // only care about top 8 bits of 16-bit R, G, or B value if (entry <= palette_count && entry >= 0) { palette_map[entry * 4 + 2] = trak->stdata[hdr_ptr + 0]; palette_map[entry * 4 + 1] = trak->stdata[hdr_ptr + 2]; palette_map[entry * 4 + 0] = trak->stdata[hdr_ptr + 4]; mp_dbg(MSGT_DEMUX, MSGL_DBG2, "QT palette: added entry: %d of %d (colors: R:%x G:%x B:%x)\n", entry, palette_count, palette_map[entry * 4 + 2], palette_map[entry * 4 + 1], palette_map[entry * 4 + 0]); } else mp_msg(MSGT_DEMUX, MSGL_V, "QT palette: skipped entry (out of count): %d of %d\n", entry, palette_count); hdr_ptr += 6; } } } else { if (trak->fourcc == mmioFOURCC('a','v','c','1')) { if (trak->stream_header_len > 0xffffffff - sizeof(*sh->bih)) { 
mp_msg(MSGT_DEMUXER, MSGL_ERR, "Invalid extradata size %d, skipping\n",trak->stream_header_len); trak->stream_header_len = 0; } sh->bih=calloc(1, sizeof(*sh->bih) + trak->stream_header_len); sh->bih->biSize=40 + trak->stream_header_len; memcpy(((unsigned char *)sh->bih)+40, trak->stream_header, trak->stream_header_len); free (trak->stream_header); trak->stream_header_len = 0; trak->stream_header = NULL; } else { sh->bih=calloc(1, sizeof(*sh->bih)); sh->bih->biSize=40; } } sh->bih->biWidth=sh->disp_w; sh->bih->biHeight=sh->disp_h; sh->bih->biPlanes=0; sh->bih->biBitCount=depth; sh->bih->biCompression=trak->fourcc; sh->bih->biSizeImage=sh->bih->biWidth*sh->bih->biHeight; mp_msg(MSGT_DEMUX, MSGL_V, "Image size: %d x %d (%d bpp)\n",sh->disp_w,sh->disp_h,sh->bih->biBitCount); if(trak->tkdata_len>81) mp_msg(MSGT_DEMUX, MSGL_V, "Display size: %d x %d\n", trak->tkdata[77]|(trak->tkdata[76]<<8), trak->tkdata[81]|(trak->tkdata[80]<<8)); mp_msg(MSGT_DEMUX, MSGL_V, "Fourcc: %.4s Codec: '%.*s'\n",(char *)&trak->fourcc,trak->stdata[42]&31,trak->stdata+43); // if(demuxer->video->id==-1 || demuxer->video->id==priv->track_db){ // // (auto)selected video track: // demuxer->video->id=priv->track_db; // demuxer->video->sh=sh; sh->ds=demuxer->video; // } return 1; } static void lschunks(demuxer_t* demuxer,int level,off_t endpos,mov_track_t* trak){ mov_priv_t* priv=demuxer->priv; // printf("lschunks (level=%d,endpos=%x)\n", level, endpos); while(1){ off_t pos; off_t len; unsigned int id; // pos=stream_tell(demuxer->stream); // printf("stream_tell==%d\n",pos); if(pos>=endpos) return; // END len=stream_read_dword(demuxer->stream); // printf("len==%d\n",len); if(len<8) return; // error len-=8; id=stream_read_dword(demuxer->stream); // mp_msg(MSGT_DEMUX,MSGL_DBG2,"lschunks %.4s %d\n",(char *)&id,(int)len); // if(trak){ if (lschunks_intrak(demuxer, level, id, pos, len, trak) < 0) return; } else { /* not in track */ switch(id) { case MOV_FOURCC('m','v','h','d'): { int version = 
stream_read_char(demuxer->stream); stream_skip(demuxer->stream, (version == 1) ? 19 : 11); priv->timescale=stream_read_dword(demuxer->stream); if (version == 1) priv->duration=stream_read_qword(demuxer->stream); else priv->duration=stream_read_dword(demuxer->stream); mp_msg(MSGT_DEMUX, MSGL_V,"MOV: %*sMovie header (%d bytes): tscale=%d dur=%d\n",level,"",(int)len, (int)priv->timescale,(int)priv->duration); break; } case MOV_FOURCC('t','r','a','k'): { // if(trak) printf("MOV: Warning! trak in trak?\n"); if(priv->track_db>=MOV_MAX_TRACKS){ mp_msg(MSGT_DEMUX,MSGL_WARN,MSGTR_MOVtooManyTrk); return; } if(!priv->track_db) mp_msg(MSGT_DEMUX, MSGL_V, "--------------\n"); trak=calloc(1, sizeof(mov_track_t)); mp_msg(MSGT_DEMUX,MSGL_V,"MOV: Track #%d:\n",priv->track_db); trak->id=priv->track_db; priv->tracks[priv->track_db]=trak; lschunks(demuxer,level+1,pos+len,trak); mov_build_index(trak,priv->timescale); switch(trak->type){ case MOV_TRAK_AUDIO: { sh_audio_t* sh=new_sh_audio(demuxer,priv->track_db, NULL); mp_msg(MSGT_DEMUX, MSGL_INFO, MSGTR_AudioID, "mov", priv->track_db); gen_sh_audio(sh, trak, priv->timescale); break; } case MOV_TRAK_VIDEO: { sh_video_t* sh=new_sh_video(demuxer,priv->track_db); mp_msg(MSGT_DEMUX, MSGL_INFO, MSGTR_VideoID, "mov", priv->track_db); gen_sh_video(sh, trak, priv->timescale); break; } case MOV_TRAK_GENERIC: if (trak->fourcc == mmioFOURCC('m','p','4','s') || trak->fourcc == mmioFOURCC('t','x','3','g') || trak->fourcc == mmioFOURCC('t','e','x','t')) { sh_sub_t *sh = new_sh_sub(demuxer, priv->track_db, NULL); mp_msg(MSGT_DEMUX, MSGL_INFO, MSGTR_SubtitleID, "mov", priv->track_db); if (trak->fourcc == mmioFOURCC('m','p','4','s')) init_vobsub(sh, trak); else { sh->type = 'm'; sub_utf8 = 1; } } else mp_msg(MSGT_DEMUX, MSGL_V, "Generic track - not completely understood! 
(id: %d)\n", trak->id); /* XXX: Also this contains the FLASH data */ #if 0 { int pos = stream_tell(demuxer->stream); int i; int fd; char name[20]; for (i=0; i<trak->samples_size; i++) { char buf[trak->samples[i].size]; stream_seek(demuxer->stream, trak->samples[i].pos); snprintf((char *)&name[0], 20, "samp%d", i); fd = open((char *)&name[0], O_CREAT|O_WRONLY); stream_read(demuxer->stream, &buf[0], trak->samples[i].size); write(fd, &buf[0], trak->samples[i].size); close(fd); } for (i=0; i<trak->chunks_size; i++) { char buf[trak->length]; stream_seek(demuxer->stream, trak->chunks[i].pos); snprintf((char *)&name[0], 20, "chunk%d", i); fd = open((char *)&name[0], O_CREAT|O_WRONLY); stream_read(demuxer->stream, &buf[0], trak->length); write(fd, &buf[0], trak->length); close(fd); } if (trak->samplesize > 0) { char *buf; buf = malloc(trak->samplesize); stream_seek(demuxer->stream, trak->chunks[0].pos); snprintf((char *)&name[0], 20, "trak%d", trak->id); fd = open((char *)&name[0], O_CREAT|O_WRONLY); stream_read(demuxer->stream, buf, trak->samplesize); write(fd, buf, trak->samplesize); close(fd); } stream_seek(demuxer->stream, pos); } #endif break; default: mp_msg(MSGT_DEMUX, MSGL_V, "Unknown track type found (type: %d)\n", trak->type); break; } mp_msg(MSGT_DEMUX, MSGL_V, "--------------\n"); priv->track_db++; trak=NULL; break; } #if !CONFIG_ZLIB case MOV_FOURCC('c','m','o','v'): { mp_msg(MSGT_DEMUX,MSGL_ERR,MSGTR_MOVcomprhdr); return; } #else case MOV_FOURCC('m','o','o','v'): case MOV_FOURCC('c','m','o','v'): { // mp_msg(MSGT_DEMUX,MSGL_ERR,MSGTR_MOVcomprhdr); lschunks(demuxer,level+1,pos+len,NULL); break; } case MOV_FOURCC('d','c','o','m'): { // int temp=stream_read_dword(demuxer->stream); unsigned int algo=be2me_32(stream_read_dword(demuxer->stream)); mp_msg(MSGT_DEMUX, MSGL_V, "Compressed header uses %.4s algo!\n",(char *)&algo); break; } case MOV_FOURCC('c','m','v','d'): { // int temp=stream_read_dword(demuxer->stream); unsigned int 
moov_sz=stream_read_dword(demuxer->stream); unsigned int cmov_sz=len-4; unsigned char* cmov_buf; unsigned char* moov_buf; int zret; z_stream zstrm; stream_t* backup; if (moov_sz > UINT_MAX - 16) { mp_msg(MSGT_DEMUX, MSGL_ERR, "Invalid cmvd atom size %d\n", moov_sz); break; } cmov_buf=malloc(cmov_sz); moov_buf=malloc(moov_sz+16); mp_msg(MSGT_DEMUX, MSGL_V, "Compressed header size: %d / %d\n",cmov_sz,moov_sz); stream_read(demuxer->stream,cmov_buf,cmov_sz); zstrm.zalloc = (alloc_func)0; zstrm.zfree = (free_func)0; zstrm.opaque = (voidpf)0; zstrm.next_in = cmov_buf; zstrm.avail_in = cmov_sz; zstrm.next_out = moov_buf; zstrm.avail_out = moov_sz; zret = inflateInit(&zstrm); if (zret != Z_OK) { mp_msg(MSGT_DEMUX, MSGL_ERR, "QT cmov: inflateInit err %d\n",zret); return; } zret = inflate(&zstrm, Z_NO_FLUSH); if ((zret != Z_OK) && (zret != Z_STREAM_END)) { mp_msg(MSGT_DEMUX, MSGL_ERR, "QT cmov inflate: ERR %d\n",zret); return; } #if 0 else { FILE *DecOut; DecOut = fopen("Out.bin", "w"); fwrite(moov_buf, 1, moov_sz, DecOut); fclose(DecOut); } #endif if(moov_sz != zstrm.total_out) mp_msg(MSGT_DEMUX, MSGL_WARN, "Warning! moov size differs cmov: %d zlib: %ld\n",moov_sz,zstrm.total_out); zret = inflateEnd(&zstrm); backup=demuxer->stream; demuxer->stream=new_memory_stream(moov_buf,moov_sz); stream_skip(demuxer->stream,8); lschunks(demuxer,level+1,moov_sz,NULL); // parse uncompr. 
'moov' //free_stream(demuxer->stream); demuxer->stream=backup; free(cmov_buf); free(moov_buf); break; } #endif case MOV_FOURCC('u','d','t','a'): { unsigned int udta_id; off_t udta_len; off_t udta_size = len; mp_msg(MSGT_DEMUX, MSGL_DBG2, "mov: user data record found\n"); mp_msg(MSGT_DEMUX, MSGL_V, "Quicktime Clip Info:\n"); while((len > 8) && (udta_size > 8)) { udta_len = stream_read_dword(demuxer->stream); udta_id = stream_read_dword(demuxer->stream); udta_size -= 8; mp_msg(MSGT_DEMUX, MSGL_DBG2, "udta_id: %.4s (len: %"PRId64")\n", (char *)&udta_id, (int64_t)udta_len); switch (udta_id) { case MOV_FOURCC(0xa9,'c','p','y'): case MOV_FOURCC(0xa9,'d','a','y'): case MOV_FOURCC(0xa9,'d','i','r'): /* 0xa9,'e','d','1' - '9' : edit timestamps */ case MOV_FOURCC(0xa9,'f','m','t'): case MOV_FOURCC(0xa9,'i','n','f'): case MOV_FOURCC(0xa9,'p','r','d'): case MOV_FOURCC(0xa9,'p','r','f'): case MOV_FOURCC(0xa9,'r','e','q'): case MOV_FOURCC(0xa9,'s','r','c'): case MOV_FOURCC('n','a','m','e'): case MOV_FOURCC(0xa9,'n','a','m'): case MOV_FOURCC(0xa9,'A','R','T'): case MOV_FOURCC(0xa9,'c','m','t'): case MOV_FOURCC(0xa9,'a','u','t'): case MOV_FOURCC(0xa9,'s','w','r'): { off_t text_len = stream_read_word(demuxer->stream); char text[text_len+2+1]; stream_read(demuxer->stream, (char *)&text, text_len+2); text[text_len+2] = 0x0; switch(udta_id) { case MOV_FOURCC(0xa9,'a','u','t'): demux_info_add(demuxer, "author", &text[2]); mp_msg(MSGT_DEMUX, MSGL_V, " Author: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'c','p','y'): demux_info_add(demuxer, "copyright", &text[2]); mp_msg(MSGT_DEMUX, MSGL_V, " Copyright: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'i','n','f'): mp_msg(MSGT_DEMUX, MSGL_V, " Info: %s\n", &text[2]); break; case MOV_FOURCC('n','a','m','e'): case MOV_FOURCC(0xa9,'n','a','m'): demux_info_add(demuxer, "title", &text[2]); mp_msg(MSGT_DEMUX, MSGL_V, " Name: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'A','R','T'): mp_msg(MSGT_DEMUX, MSGL_V, " Artist: %s\n", &text[2]); break; 
case MOV_FOURCC(0xa9,'d','i','r'): mp_msg(MSGT_DEMUX, MSGL_V, " Director: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'c','m','t'): demux_info_add(demuxer, "comments", &text[2]); mp_msg(MSGT_DEMUX, MSGL_V, " Comment: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'r','e','q'): mp_msg(MSGT_DEMUX, MSGL_V, " Requirements: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'s','w','r'): demux_info_add(demuxer, "encoder", &text[2]); mp_msg(MSGT_DEMUX, MSGL_V, " Software: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'d','a','y'): mp_msg(MSGT_DEMUX, MSGL_V, " Creation timestamp: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'f','m','t'): mp_msg(MSGT_DEMUX, MSGL_V, " Format: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'p','r','d'): mp_msg(MSGT_DEMUX, MSGL_V, " Producer: %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'p','r','f'): mp_msg(MSGT_DEMUX, MSGL_V, " Performer(s): %s\n", &text[2]); break; case MOV_FOURCC(0xa9,'s','r','c'): mp_msg(MSGT_DEMUX, MSGL_V, " Source providers: %s\n", &text[2]); break; } udta_size -= 4+text_len; break; } /* some other shits: WLOC - window location, LOOP - looping style, SelO - play only selected frames AllF - play all frames */ case MOV_FOURCC('W','L','O','C'): case MOV_FOURCC('L','O','O','P'): case MOV_FOURCC('S','e','l','O'): case MOV_FOURCC('A','l','l','F'): default: { if( udta_len>udta_size) udta_len=udta_size; { stream_skip(demuxer->stream, udta_len-4-4); udta_size -= udta_len; } } } } break; } /* eof udta */ default: id = be2me_32(id); mp_msg(MSGT_DEMUX,MSGL_V,"MOV: unknown chunk: %.4s %d\n",(char *)&id,(int)len); } /* endof switch */ } /* endof else */ pos+=len+8; if(pos>=endpos) break; if(!stream_seek(demuxer->stream,pos)) break; } } static int lschunks_intrak(demuxer_t* demuxer, int level, unsigned int id, off_t pos, off_t len, mov_track_t* trak) { switch(id) { case MOV_FOURCC('m','d','a','t'): { mp_msg(MSGT_DEMUX,MSGL_WARN,"Hmm, strange MOV, parsing mdat in lschunks?\n"); return -1; } case MOV_FOURCC('f','r','e','e'): case 
MOV_FOURCC('u','d','t','a'): /* here not supported :p */ break; case MOV_FOURCC('t','k','h','d'): { mp_msg(MSGT_DEMUX,MSGL_V,"MOV: %*sTrack header!\n", level, ""); // read codec data trak->tkdata_len = len; trak->tkdata = malloc(trak->tkdata_len); stream_read(demuxer->stream, trak->tkdata, trak->tkdata_len); /* 0 1 Version 1 3 Flags 4 4 Creation time 8 4 Modification time 12 4 Track ID 16 4 Reserved 20 4 Duration 24 8 Reserved 32 2 Layer 34 2 Alternate group 36 2 Volume 38 2 Reserved 40 36 Matrix structure 76 4 Track width 80 4 Track height */ mp_msg(MSGT_DEMUX, MSGL_V, "tkhd len=%d ver=%d flags=0x%X id=%d dur=%d lay=%d vol=%d\n", trak->tkdata_len, trak->tkdata[0], trak->tkdata[1], char2int(trak->tkdata, 12), // id char2int(trak->tkdata, 20), // duration char2short(trak->tkdata, 32), // layer char2short(trak->tkdata, 36)); // volume break; } case MOV_FOURCC('m','d','h','d'): { int version = stream_read_char(demuxer->stream); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sMedia header!\n", level, ""); stream_skip(demuxer->stream, (version == 1) ? 
19 : 11); // read timescale trak->timescale = stream_read_dword(demuxer->stream); // read length if (version == 1) trak->length = stream_read_qword(demuxer->stream); else trak->length = stream_read_dword(demuxer->stream); break; } case MOV_FOURCC('h','d','l','r'): { av_unused unsigned int tmp = stream_read_dword(demuxer->stream); unsigned int type = stream_read_dword_le(demuxer->stream); unsigned int subtype = stream_read_dword_le(demuxer->stream); unsigned int manufact = stream_read_dword_le(demuxer->stream); av_unused unsigned int comp_flags = stream_read_dword(demuxer->stream); av_unused unsigned int comp_mask = stream_read_dword(demuxer->stream); int len = stream_read_char(demuxer->stream); char* str = malloc(len + 1); stream_read(demuxer->stream, str, len); str[len] = 0; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sHandler header: %.4s/%.4s (%.4s) %s\n", level, "", (char *)&type, (char *)&subtype, (char *)&manufact, str); free(str); switch(bswap_32(type)) { case MOV_FOURCC('m','h','l','r'): trak->media_handler = bswap_32(subtype); break; case MOV_FOURCC('d','h','l','r'): trak->data_handler = bswap_32(subtype); break; default: mp_msg(MSGT_DEMUX, MSGL_V, "MOV: unknown handler class: 0x%X (%.4s)\n", bswap_32(type), (char *)&type); } break; } case MOV_FOURCC('v','m','h','d'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sVideo header!\n", level, ""); trak->type = MOV_TRAK_VIDEO; // read video data break; } case MOV_FOURCC('s','m','h','d'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSound header!\n", level, ""); trak->type = MOV_TRAK_AUDIO; // read audio data break; } case MOV_FOURCC('g','m','h','d'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sGeneric header!\n", level, ""); trak->type = MOV_TRAK_GENERIC; break; } case MOV_FOURCC('n','m','h','d'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sGeneric header!\n", level, ""); trak->type = MOV_TRAK_GENERIC; break; } case MOV_FOURCC('s','t','s','d'): { int i = stream_read_dword(demuxer->stream); // temp! 
int count = stream_read_dword(demuxer->stream); mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sDescription list! (cnt:%d)\n", level, "", count); for (i = 0; i < count; i++) { off_t pos = stream_tell(demuxer->stream); off_t len = stream_read_dword(demuxer->stream); unsigned int fourcc = stream_read_dword_le(demuxer->stream); /* some files created with Broadcast 2000 (e.g. ilacetest.mov) contain raw I420 video but have a yv12 fourcc */ if (fourcc == mmioFOURCC('y','v','1','2')) fourcc = mmioFOURCC('I','4','2','0'); if (len < 8) break; // error mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*s desc #%d: %.4s (%"PRId64" bytes)\n", level, "", i, (char *)&fourcc, (int64_t)len - 16); if (fourcc != trak->fourcc && i) mp_msg(MSGT_DEMUX, MSGL_WARN, MSGTR_MOVvariableFourCC); // if(!i) { trak->fourcc = fourcc; // read type specific (audio/video/time/text etc) header // NOTE: trak type is not yet known at this point :((( trak->stdata_len = len - 8; trak->stdata = malloc(trak->stdata_len); stream_read(demuxer->stream, trak->stdata, trak->stdata_len); } if (!stream_seek(demuxer->stream, pos + len)) break; } break; } case MOV_FOURCC('s','t','t','s'): { av_unused int temp = stream_read_dword(demuxer->stream); int len = stream_read_dword(demuxer->stream); int i; unsigned int pts = 0; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSample duration table! (%d blocks)\n", level, "", len); free(trak->durmap); trak->durmap = calloc(len, sizeof(mov_durmap_t)); trak->durmap_size = trak->durmap ? len : 0; for (i = 0; i < trak->durmap_size; i++) { trak->durmap[i].num = stream_read_dword(demuxer->stream); trak->durmap[i].dur = stream_read_dword(demuxer->stream); pts += trak->durmap[i].num * trak->durmap[i].dur; } if (trak->length != pts) mp_msg(MSGT_DEMUX, MSGL_WARN, "Warning! 
pts=%d length=%d\n", pts, trak->length); break; } case MOV_FOURCC('s','t','s','c'): { int temp = stream_read_dword(demuxer->stream); int len = stream_read_dword(demuxer->stream); int ver = (temp << 24); int flags = (temp << 16) | (temp << 8) | temp; int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSample->Chunk mapping table! (%d blocks) (ver:%d,flags:%d)\n", level, "", len, ver, flags); // read data: free(trak->chunkmap); trak->chunkmap = calloc(len, sizeof(mov_chunkmap_t)); trak->chunkmap_size = trak->chunkmap ? len : 0; for (i = 0; i < trak->chunkmap_size; i++) { trak->chunkmap[i].first = stream_read_dword(demuxer->stream) - 1; trak->chunkmap[i].spc = stream_read_dword(demuxer->stream); trak->chunkmap[i].sdid = stream_read_dword(demuxer->stream); } break; } case MOV_FOURCC('s','t','s','z'): { int temp = stream_read_dword(demuxer->stream); int ss=stream_read_dword(demuxer->stream); int ver = (temp << 24); int flags = (temp << 16) | (temp << 8) | temp; int entries = stream_read_dword(demuxer->stream); int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSample size table! (entries=%d ss=%d) (ver:%d,flags:%d)\n", level, "", entries, ss, ver, flags); trak->samplesize = ss; if (!ss) { // variable samplesize free(trak->samples); trak->samples = calloc(entries, sizeof(mov_sample_t)); trak->samples_size = trak->samples ? entries : 0; for (i = 0; i < trak->samples_size; i++) trak->samples[i].size = stream_read_dword(demuxer->stream); } break; } case MOV_FOURCC('s','t','c','o'): { av_unused int temp = stream_read_dword(demuxer->stream); int len = stream_read_dword(demuxer->stream); int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sChunk offset table! (%d chunks)\n", level, "", len); // extend array if needed: if (len > trak->chunks_size) { free(trak->chunks); trak->chunks = calloc(len, sizeof(mov_chunk_t)); trak->chunks_size = trak->chunks ? 
len : 0; } // read elements: for(i = 0; i < trak->chunks_size; i++) trak->chunks[i].pos = stream_read_dword(demuxer->stream); break; } case MOV_FOURCC('c','o','6','4'): { av_unused int temp = stream_read_dword(demuxer->stream); int len = stream_read_dword(demuxer->stream); int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*s64bit chunk offset table! (%d chunks)\n", level, "", len); // extend array if needed: if (len > trak->chunks_size) { free(trak->chunks); trak->chunks = calloc(len, sizeof(mov_chunk_t)); trak->chunks_size = trak->chunks ? len : 0; } // read elements: for (i = 0; i < trak->chunks_size; i++) { #ifndef _LARGEFILE_SOURCE if (stream_read_dword(demuxer->stream) != 0) mp_msg(MSGT_DEMUX, MSGL_WARN, "Chunk %d has got 64bit address, but you've MPlayer compiled without LARGEFILE support!\n", i); trak->chunks[i].pos = stream_read_dword(demuxer->stream); #else trak->chunks[i].pos = stream_read_qword(demuxer->stream); #endif } break; } case MOV_FOURCC('s','t','s','s'): { int temp = stream_read_dword(demuxer->stream); int entries = stream_read_dword(demuxer->stream); int ver = (temp << 24); int flags = (temp << 16) | (temp<<8) | temp; int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSyncing samples (keyframes) table! (%d entries) (ver:%d,flags:%d)\n", level, "", entries, ver, flags); free(trak->keyframes); trak->keyframes = calloc(entries, sizeof(unsigned int)); trak->keyframes_size = trak->keyframes ? 
entries : 0; for (i = 0; i < trak->keyframes_size; i++) trak->keyframes[i] = stream_read_dword(demuxer->stream) - 1; break; } case MOV_FOURCC('m','d','i','a'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sMedia stream!\n", level, ""); lschunks(demuxer, level + 1, pos + len, trak); break; } case MOV_FOURCC('m','i','n','f'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sMedia info!\n", level, ""); lschunks(demuxer, level + 1 ,pos + len, trak); break; } case MOV_FOURCC('s','t','b','l'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sSample info!\n", level, ""); lschunks(demuxer, level + 1, pos + len, trak); break; } case MOV_FOURCC('e','d','t','s'): { mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sEdit atom!\n", level, ""); lschunks(demuxer, level + 1, pos + len, trak); break; } case MOV_FOURCC('e','l','s','t'): { int temp = stream_read_dword(demuxer->stream); int entries = stream_read_dword(demuxer->stream); int ver = (temp << 24); int flags = (temp << 16) | (temp << 8) | temp; int i; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*sEdit list table (%d entries) (ver:%d,flags:%d)\n", level, "", entries, ver, flags); #if 1 free(trak->editlist); trak->editlist = calloc(entries, sizeof(mov_editlist_t)); trak->editlist_size = trak->editlist ? 
entries : 0; for (i = 0; i < trak->editlist_size; i++) { int dur = stream_read_dword(demuxer->stream); int mt = stream_read_dword(demuxer->stream); int mr = stream_read_dword(demuxer->stream); // 16.16fp trak->editlist[i].dur = dur; trak->editlist[i].pos = mt; trak->editlist[i].speed = mr; mp_msg(MSGT_DEMUX, MSGL_V, "MOV: %*s entry#%d: duration: %d start time: %d speed: %3.1fx\n", level, "", i, dur, mt, (float)mr/65536.0f); } #endif break; } case MOV_FOURCC('c','o','d','e'): { /* XXX: Implement atom 'code' for FLASH support */ break; } default: id = be2me_32(id); mp_msg(MSGT_DEMUX,MSGL_V,"MOV: unknown chunk: %.4s %d\n",(char *)&id,(int)len); break; }//switch(id) return 0; } static demuxer_t* mov_read_header(demuxer_t* demuxer){ mov_priv_t* priv=demuxer->priv; int t_no; int best_a_id=-1, best_a_len=0; int best_v_id=-1, best_v_len=0; mp_msg(MSGT_DEMUX, MSGL_DBG3, "mov_read_header!\n"); // Parse header: stream_reset(demuxer->stream); if(!stream_seek(demuxer->stream,priv->moov_start)) { mp_msg(MSGT_DEMUX,MSGL_ERR,"MOV: Cannot seek to the beginning of the Movie header (0x%"PRIx64")\n", (int64_t)priv->moov_start); return 0; } lschunks(demuxer, 0, priv->moov_end, NULL); // just in case we have hit eof while parsing... demuxer->stream->eof = 0; // mp_msg(MSGT_DEMUX, MSGL_INFO, "--------------\n"); // find the best (longest) streams: for(t_no=0;t_no<priv->track_db;t_no++){ mov_track_t* trak=priv->tracks[t_no]; int len=(trak->samplesize) ? 
trak->chunks_size : trak->samples_size; if(demuxer->a_streams[t_no]){ // need audio if(len>best_a_len){ best_a_len=len; best_a_id=t_no; } } if(demuxer->v_streams[t_no]){ // need video if(len>best_v_len){ best_v_len=len; best_v_id=t_no; } } } mp_msg(MSGT_DEMUX, MSGL_V, "MOV: longest streams: A: #%d (%d samples) V: #%d (%d samples)\n", best_a_id,best_a_len,best_v_id,best_v_len); if(demuxer->audio->id==-1 && best_a_id>=0) demuxer->audio->id=best_a_id; if(demuxer->video->id==-1 && best_v_id>=0) demuxer->video->id=best_v_id; // setup sh pointers: if(demuxer->audio->id>=0){ sh_audio_t* sh=demuxer->a_streams[demuxer->audio->id]; if(sh){ demuxer->audio->sh=sh; sh->ds=demuxer->audio; } else { mp_msg(MSGT_DEMUX, MSGL_ERR, "MOV: selected audio stream (%d) does not exist\n",demuxer->audio->id); demuxer->audio->id=-2; } } if(demuxer->video->id>=0){ sh_video_t* sh=demuxer->v_streams[demuxer->video->id]; if(sh){ demuxer->video->sh=sh; sh->ds=demuxer->video; } else { mp_msg(MSGT_DEMUX, MSGL_ERR, "MOV: selected video stream (%d) does not exist\n",demuxer->video->id); demuxer->video->id=-2; } } if(demuxer->sub->id>=0){ sh_sub_t* sh=demuxer->s_streams[demuxer->sub->id]; if(sh){ demuxer->sub->sh=sh; } else { mp_msg(MSGT_DEMUX, MSGL_ERR, "MOV: selected subtitle stream (%d) does not exist\n",demuxer->sub->id); demuxer->sub->id=-2; } } if(demuxer->video->id<0 && demuxer->audio->id<0) { /* No AV streams found. Try to find an MPEG stream. 
*/ for(t_no=0;t_no<priv->track_db;t_no++){ mov_track_t* trak=priv->tracks[t_no]; if(trak->media_handler == MOV_FOURCC('M','P','E','G')) { stream_t *s; demuxer_t *od; demuxer->video->id = t_no; s = new_ds_stream(demuxer->video); od = demux_open(s, DEMUXER_TYPE_MPEG_PS, -1, -1, -1, NULL); if(od) return new_demuxers_demuxer(od, od, od); demuxer->video->id = -2; //new linked demuxer couldn't be allocated break; } } } #if 0 if( mp_msg_test(MSGT_DEMUX,MSGL_DBG3) ){ for(t_no=0;t_no<priv->track_db;t_no++){ mov_track_t* trak=priv->tracks[t_no]; if(trak->type==MOV_TRAK_GENERIC){ int i; int fd; char name[20]; mp_msg(MSGT_DEMUX, MSGL_INFO, "MOV: Track #%d: Extracting %d data chunks to files\n",t_no,trak->samples_size); for (i=0; i<trak->samples_size; i++) { int len=trak->samples[i].size; char buf[len]; stream_seek(demuxer->stream, trak->samples[i].pos); snprintf(name, 20, "t%02d-s%03d.%s", t_no,i, (trak->media_handler==MOV_FOURCC('f','l','s','h')) ? "swf":"dump"); fd = open(name, O_CREAT|O_WRONLY); // { int j; // for(j=0;j<trak->stdata_len-3; j++) // printf("stdata[%d]=0x%X ize=0x%X\n",j,char2int(trak->stdata,j),MOV_FOURCC('z','l','i','b')); // } if( //trak->media_handler==MOV_FOURCC('s','p','r','t') && trak->stdata_len>=16 && char2int(trak->stdata,12)==MOV_FOURCC('z','l','i','b') ){ int newlen=stream_read_dword(demuxer->stream); #if CONFIG_ZLIB // unzip: z_stream zstrm; int zret; char buf2[newlen]; len-=4; stream_read(demuxer->stream, buf, len); zstrm.zalloc = (alloc_func)0; zstrm.zfree = (free_func)0; zstrm.opaque = (voidpf)0; zstrm.next_in = buf; zstrm.avail_in = len; zstrm.next_out = buf2; zstrm.avail_out = newlen; zret = inflateInit(&zstrm); zret = inflate(&zstrm, Z_NO_FLUSH); if(newlen != zstrm.total_out) mp_msg(MSGT_DEMUX, MSGL_WARN, "Warning! unzipped frame size differs hdr: %d zlib: %ld\n",newlen,zstrm.total_out); write(fd, buf2, newlen); } else { #else len-=4; mp_msg(MSGT_DEMUX, MSGL_INFO, "******* ZLIB COMPRESSED SAMPLE!!!!! 
(%d->%d bytes) *******\n",len,newlen); } { #endif stream_read(demuxer->stream, buf, len); write(fd, buf, len); } close(fd); } } } } demuxer->stream->eof = 0; #endif return demuxer; } /** * \brief return the mov track that belongs to a demuxer stream * \param ds the demuxer stream, may be NULL * \return the mov track info structure belonging to the stream, * NULL if not found */ static mov_track_t *stream_track(mov_priv_t *priv, demux_stream_t *ds) { if (ds && (ds->id >= 0) && (ds->id < priv->track_db)) return priv->tracks[ds->id]; return NULL; } // return value: // 0 = EOF or no stream found // 1 = successfully read a packet static int demux_mov_fill_buffer(demuxer_t *demuxer,demux_stream_t* ds){ mov_priv_t* priv=demuxer->priv; mov_track_t* trak=NULL; float pts; int x; off_t pos; if (ds->eof) return 0; trak = stream_track(priv, ds); if (!trak) return 0; if(trak->samplesize){ // read chunk: if(trak->pos>=trak->chunks_size) return 0; // EOF stream_seek(demuxer->stream,trak->chunks[trak->pos].pos); pts=(float)(trak->chunks[trak->pos].sample*trak->duration)/(float)trak->timescale; if(trak->samplesize!=1) { mp_msg(MSGT_DEMUX, MSGL_DBG2, "WARNING! 
Samplesize(%d) != 1\n", trak->samplesize); if((trak->fourcc != MOV_FOURCC('t','w','o','s')) && (trak->fourcc != MOV_FOURCC('s','o','w','t'))) x=trak->chunks[trak->pos].size*trak->samplesize; else x=trak->chunks[trak->pos].size; } else x=trak->chunks[trak->pos].size; // printf("X = %d\n", x); /* the following stuff is audio related */ if (trak->type == MOV_TRAK_AUDIO){ if(trak->stdata_len>=44 && trak->stdata[9]>=1 && char2int(trak->stdata,28)>0){ // stsd version 1 - we have audio compression ratio info: x/=char2int(trak->stdata,28); // samples/packet // x*=char2int(trak->stdata,32); // bytes/packet x*=char2int(trak->stdata,36); // bytes/frame } else { if(ds->ss_div && ds->ss_mul){ // workaround for buggy files like 7up-high-traffic-areas.mov, // with missing stsd v1 header containing compression rate x/=ds->ss_div; x*=ds->ss_mul; // compression ratio fix ! HACK ! } else { x*=trak->nchannels; x*=trak->samplebytes; } } mp_msg(MSGT_DEMUX, MSGL_DBG2, "Audio sample %d bytes pts %5.3f\n",trak->chunks[trak->pos].size*trak->samplesize,pts); } /* MOV_TRAK_AUDIO */ pos=trak->chunks[trak->pos].pos; } else { int frame=trak->pos; // editlist support: if(trak->type == MOV_TRAK_VIDEO && trak->editlist_size>=1){ // find the right editlist entry: if(frame<trak->editlist[trak->editlist_pos].start_frame) trak->editlist_pos=0; while(trak->editlist_pos<trak->editlist_size-1 && frame>=trak->editlist[trak->editlist_pos+1].start_frame) ++trak->editlist_pos; if(frame>=trak->editlist[trak->editlist_pos].start_frame+ trak->editlist[trak->editlist_pos].frames) return 0; // EOF // calc real frame index: frame-=trak->editlist[trak->editlist_pos].start_frame; frame+=trak->editlist[trak->editlist_pos].start_sample; // calc pts: pts=(float)(trak->samples[frame].pts+ trak->editlist[trak->editlist_pos].pts_offset)/(float)trak->timescale; } else { if(frame>=trak->samples_size) return 0; // EOF pts=(float)trak->samples[frame].pts/(float)trak->timescale; } // read sample: 
stream_seek(demuxer->stream,trak->samples[frame].pos); x=trak->samples[frame].size; pos=trak->samples[frame].pos; } if(trak->pos==0 && trak->stream_header_len>0){ // we have to append the stream header... demux_packet_t* dp=new_demux_packet(x+trak->stream_header_len); memcpy(dp->buffer,trak->stream_header,trak->stream_header_len); stream_read(demuxer->stream,dp->buffer+trak->stream_header_len,x); free(trak->stream_header); trak->stream_header = NULL; trak->stream_header_len = 0; dp->pts=pts; dp->flags=0; dp->pos=pos; // FIXME? ds_add_packet(ds,dp); } else ds_read_packet(ds,demuxer->stream,x,pts,pos,0); ++trak->pos; trak = NULL; if (demuxer->sub->id >= 0 && demuxer->sub->id < priv->track_db) trak = priv->tracks[demuxer->sub->id]; if (trak) { int samplenr = 0; while (samplenr < trak->samples_size) { double subpts = (double)trak->samples[samplenr].pts / (double)trak->timescale; if (subpts >= pts) break; samplenr++; } samplenr--; if (samplenr < 0) vo_sub = NULL; else if (samplenr != priv->current_sub) { off_t pos = trak->samples[samplenr].pos; int len = trak->samples[samplenr].size; double subpts = (double)trak->samples[samplenr].pts / (double)trak->timescale; stream_seek(demuxer->stream, pos); ds_read_packet(demuxer->sub, demuxer->stream, len, subpts, pos, 0); priv->current_sub = samplenr; } } return 1; } static float mov_seek_track(mov_track_t* trak,float pts,int flags){ // printf("MOV track seek called %5.3f \n",pts); if(flags&SEEK_FACTOR) pts*=trak->length; else pts*=(float)trak->timescale; if(trak->samplesize){ int sample=pts/trak->duration; // printf("MOV track seek - chunk: %d (pts: %5.3f dur=%d) \n",sample,pts,trak->duration); if(!(flags&SEEK_ABSOLUTE)) sample+=trak->chunks[trak->pos].sample; // relative trak->pos=0; while(trak->pos<trak->chunks_size && trak->chunks[trak->pos].sample<sample) ++trak->pos; if (trak->pos == trak->chunks_size) return -1; pts=(float)(trak->chunks[trak->pos].sample*trak->duration)/(float)trak->timescale; } else { unsigned int ipts; 
if(!(flags&SEEK_ABSOLUTE)) pts+=trak->samples[trak->pos].pts; if(pts<0) pts=0; ipts=pts; //printf("MOV track seek - sample: %d \n",ipts); for(trak->pos=0;trak->pos<trak->samples_size;++trak->pos){ if(trak->samples[trak->pos].pts>=ipts) break; // found it! } if (trak->pos == trak->samples_size) return -1; if(trak->keyframes_size){ // find nearest keyframe int i; for(i=0;i<trak->keyframes_size;i++){ if(trak->keyframes[i]>=trak->pos) break; } if (i == trak->keyframes_size) return -1; if(i>0 && (trak->keyframes[i]-trak->pos) > (trak->pos-trak->keyframes[i-1])) --i; trak->pos=trak->keyframes[i]; // printf("nearest keyframe: %d \n",trak->pos); } pts=(float)trak->samples[trak->pos].pts/(float)trak->timescale; } // printf("MOV track seek done: %5.3f \n",pts); return pts; } static void demux_seek_mov(demuxer_t *demuxer,float pts,float audio_delay,int flags){ mov_priv_t* priv=demuxer->priv; demux_stream_t* ds; mov_track_t* trak; // printf("MOV seek called %5.3f flag=%d \n",pts,flags); ds=demuxer->video; trak = stream_track(priv, ds); if (trak) { //if(flags&2) pts*=(float)trak->length/(float)trak->timescale; //if(!(flags&1)) pts+=ds->pts; ds->pts=mov_seek_track(trak,pts,flags); if (ds->pts < 0) ds->eof = 1; else pts = ds->pts; flags=1; // absolute seconds } ds=demuxer->audio; trak = stream_track(priv, ds); if (trak) { //if(flags&2) pts*=(float)trak->length/(float)trak->timescale; //if(!(flags&1)) pts+=ds->pts; ds->pts=mov_seek_track(trak,pts,flags); if (ds->pts < 0) ds->eof = 1; } } static int demux_mov_control(demuxer_t *demuxer, int cmd, void *arg){ mov_track_t* track; // try the video track track = stream_track(demuxer->priv, demuxer->video); if (!track || !track->length) // otherwise try to get the info from the audio track track = stream_track(demuxer->priv, demuxer->audio); if (!track || !track->length) return DEMUXER_CTRL_DONTKNOW; switch(cmd) { case DEMUXER_CTRL_GET_TIME_LENGTH: if (!track->timescale) return DEMUXER_CTRL_DONTKNOW; *((double *)arg) = 
(double)track->length / track->timescale; return DEMUXER_CTRL_OK; case DEMUXER_CTRL_GET_PERCENT_POS: { off_t pos = track->pos; if (track->durmap_size >= 1) pos *= track->durmap[0].dur; *((int *)arg) = (int)(100 * pos / track->length); return DEMUXER_CTRL_OK; } } return DEMUXER_CTRL_NOTIMPL; } const demuxer_desc_t demuxer_desc_mov = { "Quicktime/MP4 demuxer", "mov", "Quicktime/MOV", "Arpi, Al3x, Atmos, others", "Handles Quicktime, MP4, 3GP", DEMUXER_TYPE_MOV, 0, // slow autodetect mov_check_file, demux_mov_fill_buffer, mov_read_header, demux_close_mov, demux_seek_mov, demux_mov_control };