Mercurial > mplayer.hg
view stream/url.c @ 27518:e54c9b7eb0d8
Revert bad changes to SSA/ASS subtitle packet format
The following commits are reverted partially or completely:
"a valid ASS line contains 9 ',' before actual text"
"demux_mkv: output correctly formated ASS packets"
"libass: add a new ass_process_data() to process demuxed subtitle packets"
These commits converted the internal representation of SSA/ASS
subtitle packets from the format used by Matroska to a custom format
where each packet has contents exactly matching one line in complete
SSA script files. AFAIK no files natively use such a format for muxed
subtitles. The stated reason for this change was to use a format that
could in principle be muxed into a maximal number of containers. SSA
subtitles do not have an implicit duration so both start time and
duration or end time need to be specified explicitly; the new format
moved timing information inside the codec packet data so it could be
muxed without modification into containers that can represent only
start time at the container level. However such a change is wrong from
the viewpoint of program architecture. Timing information belongs to
the demuxer level, but these commits moved not only the duration but
also the authoritative value of the start time to inside the codec
data. Additionally the new format lost the value of the Matroska
ReadOrder field which is used by MPlayer.
This commit changes the internal packet format back to that used by
Matroska and makes the internal Matroska demuxer output that format
again. Libavformat still outputs the "new" format; it could be
converted back to the Matroska format in demux_lavf.c, but I'm not
adding that code at least yet. The current lavf code has similar
problems as the reverted code in MPlayer, and it also currently fails
to provide any way to access the value of the ReadOrder field. I hope
that the lavf side will be improved; if it isn't conversion can be
added later. For now I'll make MPlayer default to the internal Matroska
demuxer instead of the lavf one in a separate commit.
author | uau |
---|---|
date | Mon, 08 Sep 2008 21:26:22 +0000 |
parents | e96b4070ba66 |
children | 0f1b5b68af32 |
line wrap: on
line source
/* * URL Helper * by Bertrand Baudet <bertrand_baudet@yahoo.com> * (C) 2001, MPlayer team. * */ #include <string.h> #include <stdlib.h> #include <stdio.h> #include <ctype.h> #include <inttypes.h> #include "url.h" #include "mp_msg.h" #include "help_mp.h" #ifndef SIZE_MAX #define SIZE_MAX ((size_t)-1) #endif URL_t *url_redirect(URL_t **url, const char *redir) { URL_t *u = *url; URL_t *res; if (!strchr(redir, '/') || *redir == '/') { char *tmp; char *newurl = malloc(strlen(u->url) + strlen(redir) + 1); strcpy(newurl, u->url); if (*redir == '/') { redir++; tmp = strstr(newurl, "://"); if (tmp) tmp = strchr(tmp + 3, '/'); } else tmp = strrchr(newurl, '/'); if (tmp) tmp[1] = 0; strcat(newurl, redir); res = url_new(newurl); free(newurl); } else res = url_new(redir); url_free(u); *url = res; return res; } URL_t* url_new(const char* url) { int pos1, pos2,v6addr = 0; URL_t* Curl = NULL; char *escfilename=NULL; char *ptr1=NULL, *ptr2=NULL, *ptr3=NULL, *ptr4=NULL; int jumpSize = 3; if( url==NULL ) return NULL; if (strlen(url) > (SIZE_MAX / 3 - 1)) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } escfilename=malloc(strlen(url)*3+1); if (!escfilename ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } // Create the URL container Curl = malloc(sizeof(URL_t)); if( Curl==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } // Initialisation of the URL container members memset( Curl, 0, sizeof(URL_t) ); url_escape_string(escfilename,url); // Copy the url in the URL container Curl->url = strdup(escfilename); if( Curl->url==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } mp_msg(MSGT_OPEN,MSGL_V,"Filename for url is now %s\n",escfilename); // extract the protocol ptr1 = strstr(escfilename, "://"); if( ptr1==NULL ) { // Check for a special case: "sip:" (without "//"): if (strstr(escfilename, "sip:") == escfilename) { ptr1 = (char *)&url[3]; // points to ':' jumpSize = 1; } else { mp_msg(MSGT_NETWORK,MSGL_V,"Not an URL!\n"); goto err_out; } } pos1 = ptr1-escfilename; Curl->protocol = malloc(pos1+1); if( Curl->protocol==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } strncpy(Curl->protocol, escfilename, pos1); Curl->protocol[pos1] = '\0'; // jump the "://" ptr1 += jumpSize; pos1 += jumpSize; // check if a username:password is given ptr2 = strstr(ptr1, "@"); ptr3 = strstr(ptr1, "/"); if( ptr3!=NULL && ptr3<ptr2 ) { // it isn't really a username but rather a part of the path ptr2 = NULL; } if( ptr2!=NULL ) { // We got something, at least a username... int len = ptr2-ptr1; Curl->username = malloc(len+1); if( Curl->username==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } strncpy(Curl->username, ptr1, len); Curl->username[len] = '\0'; ptr3 = strstr(ptr1, ":"); if( ptr3!=NULL && ptr3<ptr2 ) { // We also have a password int len2 = ptr2-ptr3-1; Curl->username[ptr3-ptr1]='\0'; Curl->password = malloc(len2+1); if( Curl->password==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } strncpy( Curl->password, ptr3+1, len2); Curl->password[len2]='\0'; } ptr1 = ptr2+1; pos1 = ptr1-escfilename; } // before looking for a port number check if we have an IPv6 type numeric address // in IPv6 URL the numeric address should be inside square braces. ptr2 = strstr(ptr1, "["); ptr3 = strstr(ptr1, "]"); ptr4 = strstr(ptr1, "/"); if( ptr2!=NULL && ptr3!=NULL && ptr2 < ptr3 && (!ptr4 || ptr4 > ptr3)) { // we have an IPv6 numeric address ptr1++; pos1++; ptr2 = ptr3; v6addr = 1; } else { ptr2 = ptr1; } // look if the port is given ptr2 = strstr(ptr2, ":"); // If the : is after the first / it isn't the port ptr3 = strstr(ptr1, "/"); if(ptr3 && ptr3 - ptr2 < 0) ptr2 = NULL; if( ptr2==NULL ) { // No port is given // Look if a path is given if( ptr3==NULL ) { // No path/filename // So we have an URL like http://www.hostname.com pos2 = strlen(escfilename); } else { // We have an URL like http://www.hostname.com/file.txt pos2 = ptr3-escfilename; } } else { // We have an URL beginning like http://www.hostname.com:1212 // Get the port number Curl->port = atoi(ptr2+1); pos2 = ptr2-escfilename; } if( v6addr ) pos2--; // copy the hostname in the URL container Curl->hostname = malloc(pos2-pos1+1); if( Curl->hostname==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } strncpy(Curl->hostname, ptr1, pos2-pos1); Curl->hostname[pos2-pos1] = '\0'; // Look if a path is given ptr2 = strstr(ptr1, "/"); if( ptr2!=NULL ) { // A path/filename is given // check if it's not a trailing '/' if( strlen(ptr2)>1 ) { // copy the path/filename in the URL container Curl->file = strdup(ptr2); if( Curl->file==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } } } // Check if a filename was given or set, else set it with '/' if( Curl->file==NULL ) { Curl->file = malloc(2); if( Curl->file==NULL ) { mp_msg(MSGT_NETWORK,MSGL_FATAL,MSGTR_MemAllocFailed); goto err_out; } strcpy(Curl->file, "/"); } free(escfilename); return Curl; err_out: if (escfilename) free(escfilename); if (Curl) url_free(Curl); return NULL; } void url_free(URL_t* url) { if(!url) return; if(url->url) free(url->url); if(url->protocol) free(url->protocol); if(url->hostname) free(url->hostname); if(url->file) free(url->file); if(url->username) free(url->username); if(url->password) free(url->password); free(url); } /* Replace escape sequences in an URL (or a part of an URL) */ /* works like strcpy(), but without return argument */ void url_unescape_string(char *outbuf, const char *inbuf) { unsigned char c,c1,c2; int i,len=strlen(inbuf); for (i=0;i<len;i++){ c = inbuf[i]; if (c == '%' && i<len-2) { //must have 2 more chars c1 = toupper(inbuf[i+1]); // we need uppercase characters c2 = toupper(inbuf[i+2]); if ( ((c1>='0' && c1<='9') || (c1>='A' && c1<='F')) && ((c2>='0' && c2<='9') || (c2>='A' && c2<='F')) ) { if (c1>='0' && c1<='9') c1-='0'; else c1-='A'-10; if (c2>='0' && c2<='9') c2-='0'; else c2-='A'-10; c = (c1<<4) + c2; i=i+2; //only skip next 2 chars if valid esc } } *outbuf++ = c; } *outbuf++='\0'; //add nullterm to string } static void url_escape_string_part(char *outbuf, const char *inbuf) { unsigned char c,c1,c2; int i,len=strlen(inbuf); for (i=0;i<len;i++) { c = inbuf[i]; if ((c=='%') && i<len-2 ) { //need 2 more characters c1=toupper(inbuf[i+1]); c2=toupper(inbuf[i+2]); // need uppercase chars } else { c1=129; c2=129; //not escape chars } if( (c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z') || (c >= '0' && c <= '9') || (c >= 0x7f)) { *outbuf++ = c; } else if ( c=='%' && ((c1 >= '0' && c1 <= '9') || (c1 >= 'A' && c1 <= 'F')) && ((c2 >= '0' && c2 <= '9') || (c2 >= 'A' && c2 <= 'F'))) { // check if part of an escape sequence *outbuf++=c; // already // dont escape again mp_msg(MSGT_NETWORK,MSGL_ERR,MSGTR_MPDEMUX_URL_StringAlreadyEscaped,c,c1,c2); // error as this should not happen against RFC 2396 // to escape a string twice } else { /* all others will be escaped */ c1 = ((c & 0xf0) >> 4); c2 = (c & 0x0f); if (c1 < 10) c1+='0'; else c1+='A'-10; if (c2 < 10) c2+='0'; else c2+='A'-10; *outbuf++ = '%'; *outbuf++ = c1; *outbuf++ = c2; } } *outbuf++='\0'; } /* Replace specific characters in the URL string by an escape sequence */ /* works like strcpy(), but without return argument */ void url_escape_string(char *outbuf, const char *inbuf) { unsigned char c; int i = 0,j,len = strlen(inbuf); char* tmp,*unesc = NULL, *in; // Look if we have an ip6 address, if so skip it there is // no need to escape anything in there. tmp = strstr(inbuf,"://["); if(tmp) { tmp = strchr(tmp+4,']'); if(tmp && (tmp[1] == '/' || tmp[1] == ':' || tmp[1] == '\0')) { i = tmp+1-inbuf; strncpy(outbuf,inbuf,i); outbuf += i; tmp = NULL; } } tmp = NULL; while(i < len) { // look for the next char that must be kept for (j=i;j<len;j++) { c = inbuf[j]; if(c=='-' || c=='_' || c=='.' || c=='!' || c=='~' || /* mark characters */ c=='*' || c=='\'' || c=='(' || c==')' || /* do not touch escape character */ c==';' || c=='/' || c=='?' || c==':' || c=='@' || /* reserved characters */ c=='&' || c=='=' || c=='+' || c=='$' || c==',') /* see RFC 2396 */ break; } // we are on a reserved char, write it out if(j == i) { *outbuf++ = c; i++; continue; } // we found one, take that part of the string if(j < len) { if(!tmp) tmp = malloc(len+1); strncpy(tmp,inbuf+i,j-i); tmp[j-i] = '\0'; in = tmp; } else // take the rest of the string in = (char*)inbuf+i; if(!unesc) unesc = malloc(len+1); // unescape first to avoid escaping escape url_unescape_string(unesc,in); // then escape, including mark and other reserved chars // that can come from escape sequences url_escape_string_part(outbuf,unesc); outbuf += strlen(outbuf); i += strlen(in); } *outbuf = '\0'; if(tmp) free(tmp); if(unesc) free(unesc); } #ifdef URL_DEBUG void url_debug(const URL_t *url) { if( url==NULL ) { printf("URL pointer NULL\n"); return; } if( url->url!=NULL ) { printf("url=%s\n", url->url ); } if( url->protocol!=NULL ) { printf("protocol=%s\n", url->protocol ); } if( url->hostname!=NULL ) { printf("hostname=%s\n", url->hostname ); } printf("port=%d\n", url->port ); if( url->file!=NULL ) { printf("file=%s\n", url->file ); } if( url->username!=NULL ) { printf("username=%s\n", url->username ); } if( url->password!=NULL ) { printf("password=%s\n", url->password ); } } #endif /* URL_DEBUG */