Mercurial > mplayer.hg
annotate subreader.c @ 2444:ec8ff6ea4af6
Independed compilation of SUBDIRS
author | nick |
---|---|
date | Wed, 24 Oct 2001 07:34:41 +0000 |
parents | 8b971caf9e03 |
children | 7ef89d9b06ed |
rev | line source |
---|---|
258 | 1 /* |
2 * Subtitle reader with format autodetection | |
3 * | |
4 * Written by laaz | |
5 * Some code cleanup & realloc() by A'rpi/ESP-team | |
1081 | 6 * dunnowhat sub format by szabi |
258 | 7 */ |
8 | |
9 | |
10 #include <stdio.h> | |
11 #include <stdlib.h> | |
12 #include <string.h> | |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
13 #include <ctype.h> |
258 | 14 |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
15 #include "config.h" |
258 | 16 #include "subreader.h" |
17 | |
18 #define ERR (void *)-1 | |
19 | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
20 #ifdef USE_ICONV |
2358 | 21 #ifdef __FreeBSD__ |
22 #include <giconv.h> | |
23 #else | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
24 #include <iconv.h> |
2358 | 25 #endif |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
26 char *sub_cp=NULL; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
27 #endif |
258 | 28 |
2177 | 29 |
/*
 * Identifier of the subtitle format in use, -1 while unknown:
 *   0  microdvd
 *   1  SubRip
 *   2  SubViewer
 *   3  SAMI (smi)
 *   4  vplayer format
 *   5  RT format
 *   6  ssa (Sub Station Alpha)
 *   7  ... erm ... dunnowhat. tell me if you know
 *   8  the glorious MPsub
 *   9  AQTitle
 */
int sub_format = -1;

/* number of subtitle structs */
int sub_num = 0;

int sub_errs = 0;

/* Set by sub_autodetect() to 1 or 0 depending on the detected format. */
int sub_uses_time = 0;

/* Running position accumulated by sub_read_line_mpsub() across calls. */
static float mpsub_position = 0;
624 | 45 |
/* Return 1 when p ends a line (carriage return, line feed or the
 * terminating NUL), 0 for every other character. */
int eol(char p) {
    switch (p) {
    case '\r':
    case '\n':
    case '\0':
        return 1;
    default:
        return 0;
    }
}
49 | |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
/*
 * Strip leading and trailing whitespace from s, in place.
 *
 * The leading run is removed with a single memmove(): the previous
 * strcpy(s, s + 1) copied between overlapping buffers, which is undefined
 * behaviour, and did so once per leading blank.  Characters are cast to
 * unsigned char before isspace() so bytes >= 0x80 are not passed as
 * negative values.
 */
static inline void trail_space(char *s) {
    char *first = s;
    size_t len;

    while (isspace((unsigned char)*first)) first++;

    len = strlen(first);
    if (first != s) memmove(s, first, len + 1);   /* +1 moves the NUL too */

    /* s[0] is now either NUL or a non-blank, so this stops at index 0 */
    while (len > 0 && isspace((unsigned char)s[len - 1])) s[--len] = '\0';
}
624 | 56 |
2343 | 57 |
624 | 58 subtitle *sub_read_line_sami(FILE *fd, subtitle *current) { |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
59 static char line[1001]; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
60 static char *s = NULL; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
61 char text[1000], *p, *q; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
62 int state; |
624 | 63 |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
64 current->lines = current->start = current->end = 0; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
65 state = 0; |
624 | 66 |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
67 /* read the first line */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
68 if (!s) |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
69 if (!(s = fgets(line, 1000, fd))) return 0; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
70 |
624 | 71 do { |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
72 switch (state) { |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
73 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
74 case 0: /* find "START=" */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
75 s = strstr (s, "Start="); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
76 if (s) { |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
77 current->start = strtol (s + 6, &s, 0) / 10; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
78 state = 1; continue; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
79 } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
80 break; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
81 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
82 case 1: /* find "<P" */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
83 if ((s = strstr (s, "<P"))) { s += 2; state = 2; continue; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
84 break; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
85 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
86 case 2: /* find ">" */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
87 if ((s = strchr (s, '>'))) { s++; state = 3; p = text; continue; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
88 break; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
89 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
90 case 3: /* get all text until '<' appears */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
91 if (*s == '\0') { break; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
92 else if (*s == '<') { state = 4; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
93 else if (!strncasecmp (s, " ", 6)) { *p++ = ' '; s += 6; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
94 else if (*s == '\r') { s++; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
95 else if (!strncasecmp (s, "<br>", 4) || *s == '\n') { |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
96 *p = '\0'; p = text; trail_space (text); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
97 if (text[0] != '\0') |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
98 current->text[current->lines++] = strdup (text); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
99 if (*s == '\n') s++; else s += 4; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
100 } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
101 else *p++ = *s++; |
624 | 102 continue; |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
103 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
104 case 4: /* get current->end or skip <TAG> */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
105 q = strstr (s, "Start="); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
106 if (q) { |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
107 current->end = strtol (q + 6, &q, 0) / 10 - 1; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
108 *p = '\0'; trail_space (text); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
109 if (text[0] != '\0') |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
110 current->text[current->lines++] = strdup (text); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
111 if (current->lines > 0) { state = 99; break; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
112 state = 0; continue; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
113 } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
114 s = strchr (s, '>'); |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
115 if (s) { s++; state = 3; continue; } |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
116 break; |
624 | 117 } |
118 | |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
119 /* read next line */ |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
120 if (state != 99 && !(s = fgets (line, 1000, fd))) return 0; |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
121 |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
122 } while (state != 99); |
624 | 123 |
124 return current; | |
125 } | |
258 | 126 |
127 | |
128 char *sub_readtext(char *source, char **dest) { | |
129 int len=0; | |
932 | 130 char *p=source; |
258 | 131 |
932 | 132 while ( !eol(*p) && *p!= '|' ) { |
133 p++,len++; | |
134 } | |
258 | 135 |
136 *dest= (char *)malloc (len+1); | |
137 if (!dest) {return ERR;} | |
138 | |
139 strncpy(*dest, source, len); | |
140 (*dest)[len]=0; | |
141 | |
142 while (*p=='\r' || *p=='\n' || *p=='|') p++; | |
143 | |
144 if (*p) return p; // not-last text field | |
145 else return NULL; // last text field | |
146 } | |
147 | |
148 subtitle *sub_read_line_microdvd(FILE *fd,subtitle *current) { | |
149 char line[1001]; | |
150 char line2[1001]; | |
151 char *p, *next; | |
152 int i; | |
153 | |
1764 | 154 bzero (current, sizeof(subtitle)); |
258 | 155 |
156 do { | |
157 if (!fgets (line, 1000, fd)) return NULL; | |
932 | 158 } while (sscanf (line, "{%ld}{%ld}%[^\r\n]", &(current->start), &(current->end),line2) <3); |
258 | 159 |
932 | 160 p=line2; |
258 | 161 |
162 next=p, i=0; | |
1081 | 163 while ((next =sub_readtext (next, &(current->text[i])))) { |
270 | 164 if (current->text[i]==ERR) {return ERR;} |
258 | 165 i++; |
1081 | 166 if (i>=SUB_MAX_TEXT) { printf ("Too many lines in a subtitle\n");current->lines=i;return current;} |
258 | 167 } |
932 | 168 current->lines= ++i; |
258 | 169 |
170 return current; | |
171 } | |
172 | |
173 subtitle *sub_read_line_subrip(FILE *fd, subtitle *current) { | |
174 char line[1001]; | |
175 int a1,a2,a3,a4,b1,b2,b3,b4; | |
176 char *p=NULL, *q=NULL; | |
177 int len; | |
178 | |
1764 | 179 bzero (current, sizeof(subtitle)); |
258 | 180 |
1764 | 181 while (1) { |
258 | 182 if (!fgets (line, 1000, fd)) return NULL; |
269 | 183 if (sscanf (line, "%d:%d:%d.%d,%d:%d:%d.%d",&a1,&a2,&a3,&a4,&b1,&b2,&b3,&b4) < 8) continue; |
258 | 184 current->start = a1*360000+a2*6000+a3*100+a4; |
185 current->end = b1*360000+b2*6000+b3*100+b4; | |
186 | |
187 if (!fgets (line, 1000, fd)) return NULL; | |
188 | |
189 p=q=line; | |
190 for (current->lines=1; current->lines < SUB_MAX_TEXT; current->lines++) { | |
191 for (q=p,len=0; *p && *p!='\r' && *p!='\n' && strncmp(p,"[br]",4); p++,len++); | |
192 current->text[current->lines-1]=(char *)malloc (len+1); | |
193 if (!current->text[current->lines-1]) return ERR; | |
194 strncpy (current->text[current->lines-1], q, len); | |
270 | 195 current->text[current->lines-1][len]='\0'; |
258 | 196 if (!*p || *p=='\r' || *p=='\n') break; |
197 while (*p++!=']'); | |
198 } | |
1764 | 199 break; |
258 | 200 } |
201 return current; | |
202 } | |
203 | |
204 subtitle *sub_read_line_third(FILE *fd,subtitle *current) { | |
205 char line[1001]; | |
206 int a1,a2,a3,a4,b1,b2,b3,b4; | |
207 char *p=NULL; | |
208 int i,len; | |
209 | |
1764 | 210 bzero (current, sizeof(subtitle)); |
258 | 211 |
212 while (!current->text[0]) { | |
213 if (!fgets (line, 1000, fd)) return NULL; | |
269 | 214 if ((len=sscanf (line, "%d:%d:%d,%d --> %d:%d:%d,%d",&a1,&a2,&a3,&a4,&b1,&b2,&b3,&b4)) < 8) |
258 | 215 continue; |
216 current->start = a1*360000+a2*6000+a3*100+a4/10; | |
217 current->end = b1*360000+b2*6000+b3*100+b4/10; | |
218 for (i=0; i<SUB_MAX_TEXT;) { | |
269 | 219 if (!fgets (line, 1000, fd)) break; |
258 | 220 len=0; |
221 for (p=line; *p!='\n' && *p!='\r' && *p; p++,len++); | |
222 if (len) { | |
223 current->text[i]=(char *)malloc (len+1); | |
224 if (!current->text[i]) return ERR; | |
270 | 225 strncpy (current->text[i], line, len); current->text[i][len]='\0'; |
258 | 226 i++; |
227 } else { | |
228 break; | |
229 } | |
230 } | |
231 current->lines=i; | |
232 } | |
233 return current; | |
234 } | |
235 | |
818 | 236 subtitle *sub_read_line_vplayer(FILE *fd,subtitle *current) { |
237 char line[1001]; | |
238 char line2[1001]; | |
239 int a1,a2,a3,b1,b2,b3; | |
1081 | 240 char *p=NULL, *next; |
858 | 241 int i,len,len2,plen; |
818 | 242 |
1764 | 243 bzero (current, sizeof(subtitle)); |
818 | 244 |
245 while (!current->text[0]) { | |
246 if (!fgets (line, 1000, fd)) return NULL; | |
858 | 247 if ((len=sscanf (line, "%d:%d:%d:%n",&a1,&a2,&a3,&plen)) < 3) |
818 | 248 continue; |
249 if (!fgets (line2, 1000, fd)) return NULL; | |
250 if ((len2=sscanf (line2, "%d:%d:%d:",&b1,&b2,&b3)) < 3) | |
251 continue; | |
252 // przewiñ o linijkê do ty³u: | |
253 fseek(fd,-strlen(line2),SEEK_CUR); | |
254 | |
255 current->start = a1*360000+a2*6000+a3*100; | |
256 current->end = b1*360000+b2*6000+b3*100; | |
896
d46de26aef48
there is another format that get detected as vplayers.
eyck
parents:
892
diff
changeset
|
257 if ((current->end - current->start) > 1000) {current->end = current->start + 1000;} // not too long though. |
818 | 258 // teraz czas na wkopiowanie stringu |
1640
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
259 p=line; |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
260 // finds the body of the subtitle |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
261 for (i=0; i<3; i++){ |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
262 p=strchr(p,':')+1; |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
263 } |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
264 i=0; |
cbedcfab877b
Fixup to vplayer subtitle submitted to sourceforge by Igor Wojnicki
eyck
parents:
1501
diff
changeset
|
265 |
818 | 266 if (*p!='|') { |
267 // | |
268 next = p,i=0; | |
269 while ((next =sub_readtext (next, &(current->text[i])))) { | |
270 if (current->text[i]==ERR) {return ERR;} | |
271 i++; | |
1081 | 272 if (i>=SUB_MAX_TEXT) { printf ("Too many lines in a subtitle\n");current->lines=i;return current;} |
818 | 273 } |
274 current->lines=i+1; | |
275 } | |
276 } | |
277 return current; | |
278 } | |
279 | |
850 | 280 subtitle *sub_read_line_rt(FILE *fd,subtitle *current) { |
281 //TODO: This format uses quite rich (sub/super)set of xhtml | |
282 // I couldn't check it since DTD is not included. | |
283 // WARNING: full XML parses can be required for proper parsing | |
284 char line[1001]; | |
285 int a1,a2,a3,a4,b1,b2,b3,b4; | |
286 char *p=NULL,*next=NULL; | |
287 int i,len,plen; | |
288 | |
1764 | 289 bzero (current, sizeof(subtitle)); |
850 | 290 |
291 while (!current->text[0]) { | |
292 if (!fgets (line, 1000, fd)) return NULL; | |
293 //TODO: it seems that format of time is not easily determined, it may be 1:12, 1:12.0 or 0:1:12.0 | |
294 //to describe the same moment in time. Maybe there are even more formats in use. | |
295 //if ((len=sscanf (line, "<Time Begin=\"%d:%d:%d.%d\" End=\"%d:%d:%d.%d\"",&a1,&a2,&a3,&a4,&b1,&b2,&b3,&b4)) < 8) | |
296 plen=a1=a2=a3=a4=b1=b2=b3=b4=0; | |
297 if ( | |
298 ((len=sscanf (line, "<%*[tT]ime %*[bB]egin=\"%d:%d\" %*[Ee]nd=\"%d:%d\"%*[^<]<clear/>%n",&a2,&a3,&b2,&b3,&plen)) < 4) && | |
299 ((len=sscanf (line, "<%*[tT]ime %*[bB]egin=\"%d:%d\" %*[Ee]nd=\"%d:%d.%d\"%*[^<]<clear/>%n",&a2,&a3,&b2,&b3,&b4,&plen)) < 5) && | |
300 // ((len=sscanf (line, "<%*[tT]ime %*[bB]egin=\"%d:%d.%d\" %*[Ee]nd=\"%d:%d\"%*[^<]<clear/>%n",&a2,&a3,&a4,&b2,&b3,&plen)) < 5) && | |
301 ((len=sscanf (line, "<%*[tT]ime %*[bB]egin=\"%d:%d.%d\" %*[Ee]nd=\"%d:%d.%d\"%*[^<]<clear/>%n",&a2,&a3,&a4,&b2,&b3,&b4,&plen)) < 6) && | |
302 ((len=sscanf (line, "<%*[tT]ime %*[bB]egin=\"%d:%d:%d.%d\" %*[Ee]nd=\"%d:%d:%d.%d\"%*[^<]<clear/>%n",&a1,&a2,&a3,&a4,&b1,&b2,&b3,&b4,&plen)) < 8) | |
303 ) | |
304 continue; | |
305 current->start = a1*360000+a2*6000+a3*100+a4/10; | |
306 current->end = b1*360000+b2*6000+b3*100+b4/10; | |
307 p=line; p+=plen;i=0; | |
308 // TODO: I don't know what kind of convention is here for marking multiline subs, maybe <br/> like in xml? | |
309 next = strstr(line,"<clear/>")+8;i=0; | |
310 while ((next =sub_readtext (next, &(current->text[i])))) { | |
311 if (current->text[i]==ERR) {return ERR;} | |
312 i++; | |
1081 | 313 if (i>=SUB_MAX_TEXT) { printf ("Too many lines in a subtitle\n");current->lines=i;return current;} |
850 | 314 } |
315 current->lines=i+1; | |
316 } | |
317 return current; | |
318 } | |
319 | |
921 | 320 subtitle *sub_read_line_ssa(FILE *fd,subtitle *current) { |
321 int hour1, min1, sec1, hunsec1, | |
322 hour2, min2, sec2, hunsec2, nothing; | |
2141 | 323 int num; |
921 | 324 |
325 char line[1000], | |
2140 | 326 line3[1000], |
327 *line2; | |
2141 | 328 char *tmp; |
329 | |
921 | 330 do { |
331 if (!fgets (line, 1000, fd)) return NULL; | |
332 } while (sscanf (line, "Dialogue: Marked=%d,%d:%d:%d.%d,%d:%d:%d.%d," | |
2140 | 333 "%[^\n\r]", ¬hing, |
334 &hour1, &min1, &sec1, &hunsec1, | |
335 &hour2, &min2, &sec2, &hunsec2, | |
336 line3) < 9); | |
337 line2=strstr(line3,",,"); | |
338 if (!line2) return NULL; | |
339 line2 ++; | |
340 line2 ++; | |
341 | |
2141 | 342 current->lines=1;num=0; |
921 | 343 current->start = 360000*hour1 + 6000*min1 + 100*sec1 + hunsec1; |
344 current->end = 360000*hour2 + 6000*min2 + 100*sec2 + hunsec2; | |
2141 | 345 |
346 while (tmp=strstr(line2, "\\n")) { | |
347 current->text[num]=(char *)malloc(tmp-line2+1); | |
348 strncpy (current->text[num], line2, tmp-line2); | |
349 current->text[num][tmp-line2]='\0'; | |
350 line2=tmp+2; | |
351 num++; | |
352 current->lines++; | |
353 if (current->lines >= SUB_MAX_TEXT) return current; | |
354 } | |
355 | |
356 | |
357 current->text[num]=(char *) malloc(strlen(line2)+1); | |
358 strcpy(current->text[num],line2); | |
818 | 359 |
921 | 360 return current; |
361 } | |
258 | 362 |
1081 | 363 subtitle *sub_read_line_dunnowhat(FILE *fd,subtitle *current) { |
364 char line[1001]; | |
365 char text[1001]; | |
366 | |
1764 | 367 bzero (current, sizeof(subtitle)); |
1081 | 368 |
369 if (!fgets (line, 1000, fd)) | |
370 return NULL; | |
371 if (sscanf (line, "%ld,%ld,\"%[^\"]", &(current->start), | |
372 &(current->end), text) <3) | |
373 return ERR; | |
374 current->text[0] = strdup(text); | |
375 current->lines = 1; | |
376 | |
377 return current; | |
378 } | |
379 | |
2177 | 380 subtitle *sub_read_line_mpsub(FILE *fd, subtitle *current) { |
381 char line[1000]; | |
2178 | 382 float a,b; |
383 int num=0; | |
2177 | 384 char *p, *q; |
385 | |
386 do | |
387 { | |
388 if (!fgets(line, 1000, fd)) return NULL; | |
2178 | 389 } while (sscanf (line, "%f %f", &a, &b) !=2); |
2177 | 390 |
2178 | 391 mpsub_position += (a*100.0); |
392 current->start=(int) mpsub_position; | |
393 mpsub_position += (b*100.0); | |
394 current->end=(int) mpsub_position; | |
2177 | 395 |
396 while (num < SUB_MAX_TEXT) { | |
397 if (!fgets (line, 1000, fd)) return NULL; | |
398 p=line; | |
399 while (isspace(*p)) p++; | |
400 if (eol(*p) && num > 0) return current; | |
401 if (eol(*p)) return NULL; | |
402 | |
403 for (q=p; !eol(*q); q++); | |
404 *q='\0'; | |
405 if (strlen(p)) { | |
406 current->text[num]=strdup(p); | |
407 current->lines = ++num; | |
408 } else { | |
409 if (num) return current; | |
410 else return NULL; | |
411 } | |
412 } | |
413 } | |
414 | |
2343 | 415 subtitle *previous_aqt_sub = NULL; |
416 | |
417 subtitle *sub_read_line_aqt(FILE *fd,subtitle *current) { | |
418 char line[1001]; | |
419 | |
420 bzero (current, sizeof(subtitle)); | |
421 | |
422 while (1) { | |
423 // try to locate next subtitle | |
424 if (!fgets (line, 1000, fd)) | |
425 return NULL; | |
426 if (!(sscanf (line, "-->> %ld", &(current->start)) <1)) | |
427 break; | |
428 } | |
429 | |
430 if (previous_aqt_sub != NULL) | |
431 previous_aqt_sub->end = current->start-1; | |
432 | |
433 previous_aqt_sub = current; | |
434 | |
435 if (!fgets (line, 1000, fd)) | |
436 return NULL; | |
437 | |
438 sub_readtext(&line,¤t->text[0]); | |
439 current->lines = 1; | |
440 current->end = current->start; // will be corrected by next subtitle | |
441 | |
442 if (!fgets (line, 1000, fd)) | |
443 return current;; | |
444 | |
445 sub_readtext(&line,¤t->text[1]); | |
446 current->lines = 2; | |
447 | |
448 if ((current->text[0]=="") && (current->text[1]=="")) { | |
449 // void subtitle -> end of previous marked and exit | |
450 previous_aqt_sub = NULL; | |
451 return NULL; | |
452 } | |
453 | |
454 return current; | |
455 } | |
2177 | 456 |
258 | 457 int sub_autodetect (FILE *fd) { |
458 char line[1001]; | |
459 int i,j=0; | |
2177 | 460 char p; |
258 | 461 |
624 | 462 while (j < 100) { |
258 | 463 j++; |
464 if (!fgets (line, 1000, fd)) | |
465 return -1; | |
466 | |
624 | 467 if (sscanf (line, "{%d}{%d}", &i, &i)==2) |
258 | 468 {sub_uses_time=0;return 0;} |
269 | 469 if (sscanf (line, "%d:%d:%d.%d,%d:%d:%d.%d", &i, &i, &i, &i, &i, &i, &i, &i)==8) |
258 | 470 {sub_uses_time=1;return 1;} |
269 | 471 if (sscanf (line, "%d:%d:%d,%d --> %d:%d:%d,%d", &i, &i, &i, &i, &i, &i, &i, &i)==8) |
258 | 472 {sub_uses_time=1;return 2;} |
624 | 473 if (strstr (line, "<SAMI>")) |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
474 {sub_uses_time=1; return 3;} |
818 | 475 if (sscanf (line, "%d:%d:%d:", &i, &i, &i )==3) |
476 {sub_uses_time=1;return 4;} | |
850 | 477 //TODO: just checking if first line of sub starts with "<" is WAY |
913
18c43d261c35
corrected strcmp() bug, now it works again with every subs (it was broken)
laaz
parents:
896
diff
changeset
|
478 // too weak test for RT |
18c43d261c35
corrected strcmp() bug, now it works again with every subs (it was broken)
laaz
parents:
896
diff
changeset
|
479 // Please someone who knows the format of RT... FIX IT!!! |
921 | 480 // It may conflict with other sub formats in the future (actually it doesn't) |
913
18c43d261c35
corrected strcmp() bug, now it works again with every subs (it was broken)
laaz
parents:
896
diff
changeset
|
481 if ( *line == '<' ) |
850 | 482 {sub_uses_time=1;return 5;} |
921 | 483 |
484 // I have only seen only 1 piece of .ssa file. | |
485 // It may be not correct (tell me if it's not) | |
486 if (!memcmp(line, "Dialogue: Marked", 16)) | |
487 {sub_uses_time=1; return 6;} | |
1081 | 488 if (sscanf (line, "%d,%d,\"%c", &i, &i, (char *) &i) == 3) |
489 {sub_uses_time=0;return 7;} | |
2177 | 490 if (sscanf (line, "FORMAT=%d", &i) == 1) |
491 {sub_uses_time=0; return 8;} | |
492 if (sscanf (line, "FORMAT=TIM%c", &p)==1 && p=='E') | |
493 {sub_uses_time=1; return 8;} | |
2343 | 494 if (strstr (line, "-->>")) |
495 {sub_uses_time=0; return 9;} | |
258 | 496 } |
624 | 497 |
498 return -1; // too many bad lines | |
258 | 499 } |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
500 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
501 extern int sub_utf8; |
258 | 502 |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
503 #ifdef USE_ICONV |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
504 static iconv_t icdsc; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
505 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
506 void subcp_open (void) |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
507 { |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
508 char *tocp = "UTF-8"; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
509 icdsc = (iconv_t)(-1); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
510 if (sub_cp){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
511 if ((icdsc = iconv_open (tocp, sub_cp)) != (iconv_t)(-1)){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
512 printf ("SUB: opened iconv descriptor.\n"); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
513 sub_utf8 = 2; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
514 } else |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
515 printf ("SUB: error opening iconv descriptor.\n"); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
516 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
517 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
518 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
519 void subcp_close (void) |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
520 { |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
521 if (icdsc != (iconv_t)(-1)){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
522 (void) iconv_close (icdsc); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
523 printf ("SUB: closed iconv descriptor.\n"); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
524 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
525 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
526 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
527 #define ICBUFFSIZE 512 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
528 static char icbuffer[ICBUFFSIZE]; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
529 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
530 subtitle* subcp_recode (subtitle *sub) |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
531 { |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
532 int l=sub->lines; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
533 size_t ileft, oleft, otlen; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
534 char *op, *ip, *ot; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
535 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
536 while (l){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
537 op = icbuffer; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
538 ip = sub->text[--l]; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
539 ileft = strlen(ip); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
540 oleft = ICBUFFSIZE - 1; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
541 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
542 if (iconv(icdsc, (const char **) &ip, &ileft, |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
543 &op, &oleft) == (size_t)(-1)) { |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
544 printf ("SUB: error recoding line.\n"); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
545 l++; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
546 break; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
547 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
548 if (!(ot = (char *)malloc(op - icbuffer + 1))){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
549 printf ("SUB: error allocating mem.\n"); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
550 l++; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
551 break; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
552 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
553 *op='\0' ; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
554 strcpy (ot, icbuffer); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
555 free (sub->text[l]); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
556 sub->text[l] = ot; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
557 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
558 if (l){ |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
559 for (l = sub->lines; l;) |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
560 free (sub->text[--l]); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
561 return ERR; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
562 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
563 return sub; |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
564 } |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
565 |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
566 #endif |
258 | 567 |
568 subtitle* sub_read_file (char *filename) { | |
569 FILE *fd; | |
570 int n_max; | |
571 subtitle *first; | |
1081 | 572 subtitle * (*func[])(FILE *fd,subtitle *dest)= |
258 | 573 { |
574 sub_read_line_microdvd, | |
575 sub_read_line_subrip, | |
624 | 576 sub_read_line_third, |
818 | 577 sub_read_line_sami, |
850 | 578 sub_read_line_vplayer, |
921 | 579 sub_read_line_rt, |
1081 | 580 sub_read_line_ssa, |
2177 | 581 sub_read_line_dunnowhat, |
2343 | 582 sub_read_line_mpsub, |
583 sub_read_line_aqt | |
584 | |
258 | 585 }; |
586 | |
587 fd=fopen (filename, "r"); if (!fd) return NULL; | |
588 | |
589 sub_format=sub_autodetect (fd); | |
590 if (sub_format==-1) {printf ("SUB: Could not determine file format\n");return NULL;} | |
624 | 591 printf ("SUB: Detected subtitle file format: %d\n",sub_format); |
258 | 592 |
593 rewind (fd); | |
594 | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
595 #ifdef USE_ICONV |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
596 subcp_open(); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
597 #endif |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
598 |
258 | 599 sub_num=0;n_max=32; |
600 first=(subtitle *)malloc(n_max*sizeof(subtitle)); | |
601 if(!first) return NULL; | |
602 | |
603 while(1){ | |
604 subtitle *sub; | |
605 if(sub_num>=n_max){ | |
606 n_max+=16; | |
607 first=realloc(first,n_max*sizeof(subtitle)); | |
608 } | |
609 sub=func[sub_format](fd,&first[sub_num]); | |
610 if(!sub) break; // EOF | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
611 #ifdef USE_ICONV |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
612 if ((sub!=ERR) && (sub_utf8 & 2)) sub=subcp_recode(sub); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
613 #endif |
258 | 614 if(sub==ERR) ++sub_errs; else ++sub_num; // Error vs. Valid |
615 } | |
616 | |
617 fclose(fd); | |
618 | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
619 #ifdef USE_ICONV |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
620 subcp_close(); |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
621 #endif |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
622 |
258 | 623 // printf ("SUB: Subtitle format %s time.\n", sub_uses_time?"uses":"doesn't use"); |
269 | 624 printf ("SUB: Read %i subtitles", sub_num); |
624 | 625 if (sub_errs) printf (", %i bad line(s).\n", sub_errs); |
269 | 626 else printf (".\n"); |
258 | 627 |
628 return first; | |
629 } | |
630 | |
892 | 631 #if 0 |
/*
 * Overwrite the first occurrence of `what` inside `in` with `whereof`.
 *
 * The replacement is written in place, byte for byte, starting where
 * `what` was found.  If `what` is longer than `whereof`, the string is
 * terminated right after the replacement (anything that followed is
 * cut off); otherwise the bytes after the replacement are left as they
 * were.  The caller must make sure `in` has room for `whereof` at the
 * match position.
 *
 * Returns `in`, or NULL if any argument is NULL or `what` does not occur
 * in `in`.
 */
char * strreplace( char * in,char * what,char * whereof )
{
 size_t what_len, new_len;
 char * hit;

 if ( ( in == NULL )||( what == NULL )||( whereof == NULL ) ) return NULL;
 hit=strstr( in,what );
 if ( hit == NULL ) return NULL;

 /* measure once instead of on every loop iteration */
 what_len=strlen( what );
 new_len=strlen( whereof );

 /* memmove: `whereof` may legitimately point into `in` */
 memmove( hit,whereof,new_len );
 if ( what_len > new_len ) hit[new_len]=0;
 return in;
}
892 | 642 #endif |
509 | 643 |
892 | 644 char * sub_filename(char* path, char * fname ) |
509 | 645 { |
892 | 646 char * sub_name1; |
647 char * sub_name2; | |
934
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
648 char * aviptr1, * aviptr2, * tmp; |
892 | 649 int i,j; |
650 FILE * f; | |
651 int pos=0; | |
652 char * sub_exts[] = | |
1501
d40f2b686846
changes according to -utf8 option, draw_osd() function added
atlka
parents:
1081
diff
changeset
|
653 { ".utf", |
d40f2b686846
changes according to -utf8 option, draw_osd() function added
atlka
parents:
1081
diff
changeset
|
654 ".UTF", |
d40f2b686846
changes according to -utf8 option, draw_osd() function added
atlka
parents:
1081
diff
changeset
|
655 ".sub", |
509 | 656 ".SUB", |
657 ".srt", | |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
658 ".SRT", |
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
659 ".smi", |
850 | 660 ".SMI", |
661 ".rt", | |
662 ".RT", | |
663 ".txt", | |
1081 | 664 ".TXT", |
665 ".ssa", | |
2343 | 666 ".SSA", |
667 ".aqt", | |
668 ".AQT"}; | |
892 | 669 |
934
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
670 |
509 | 671 if ( fname == NULL ) return NULL; |
892 | 672 |
673 sub_name1=strrchr(fname,'.'); | |
674 if (!sub_name1) return NULL; | |
675 pos=sub_name1-fname; | |
676 | |
934
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
677 sub_name1=malloc(strlen(fname)+8); |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
678 strcpy(sub_name1,fname); |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
679 |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
680 sub_name2=malloc (strlen(path) + strlen(fname) + 8); |
1081 | 681 if ((tmp=strrchr(fname,'/'))) |
934
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
682 sprintf (sub_name2, "%s%s", path, tmp+1); |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
683 else |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
684 sprintf (sub_name2, "%s%s", path, fname); |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
685 |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
686 aviptr1=strrchr(sub_name1,'.'); |
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
687 aviptr2=strrchr(sub_name2,'.'); |
892 | 688 |
689 for(j=0;j<=1;j++){ | |
690 char* sub_name=j?sub_name1:sub_name2; | |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
691 #ifdef USE_ICONV |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
692 for ( i=(sub_cp?2:0);i<(sizeof(sub_exts)/sizeof(char*));i++ ) { |
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
693 #else |
892 | 694 for ( i=0;i<(sizeof(sub_exts)/sizeof(char*));i++ ) { |
2151
a9d91476085a
modifications to use iconv(3) function to recode text of subs (autodetect)
atlka
parents:
2141
diff
changeset
|
695 #endif |
934
b2c7c4b49948
Gabucino (CGA user)'s request (finds default.subs well)
laaz
parents:
932
diff
changeset
|
696 strcpy(j?aviptr1:aviptr2,sub_exts[i]); |
935 | 697 // printf("trying: '%s'\n",sub_name); |
892 | 698 if((f=fopen( sub_name,"rt" ))) { |
509 | 699 fclose( f ); |
700 printf( "SUB: Detected sub file: %s\n",sub_name ); | |
1501
d40f2b686846
changes according to -utf8 option, draw_osd() function added
atlka
parents:
1081
diff
changeset
|
701 if (i<2) sub_utf8=1; |
509 | 702 return sub_name; |
892 | 703 } |
509 | 704 } |
892 | 705 } |
706 | |
509 | 707 return NULL; |
708 } | |
709 | |
1761 | 710 void list_sub_file(subtitle* subs){ |
711 int i,j; | |
712 | |
713 for(j=0;j<sub_num;j++){ | |
714 subtitle* egysub=&subs[j]; | |
715 printf ("%i line%c (%li-%li) ", | |
716 egysub->lines, | |
717 (1==egysub->lines)?' ':'s', | |
718 egysub->start, | |
719 egysub->end); | |
720 for (i=0; i<egysub->lines; i++) { | |
721 printf ("%s%s",egysub->text[i], i==egysub->lines-1?"":" <BREAK> "); | |
722 } | |
723 printf ("\n"); | |
724 } | |
725 | |
726 printf ("Subtitle format %s time.\n", sub_uses_time?"uses":"doesn't use"); | |
727 printf ("Read %i subtitles, %i errors.\n", sub_num, sub_errs); | |
728 | |
729 } | |
730 | |
2178 | 731 void dump_mpsub(subtitle* subs){ |
732 int i,j; | |
733 FILE *fd; | |
734 float a,b; | |
735 | |
736 mpsub_position=0.0; | |
737 | |
738 fd=fopen ("dump.mpsub", "w"); | |
739 if (!fd) { | |
740 perror ("dump_mpsub: fopen"); | |
741 return; | |
742 } | |
743 | |
744 | |
745 if (sub_uses_time) fprintf (fd,"FORMAT=TIME\n\n"); | |
746 else fprintf (fd, "FORMAT=25"); // FIXME: fps | |
747 | |
748 for(j=0;j<sub_num;j++){ | |
749 subtitle* egysub=&subs[j]; | |
750 a=((egysub->start-mpsub_position)/100.0); | |
751 b=((egysub->end-egysub->start)/100.0); | |
752 if ( (float)((int)a) == a) | |
753 fprintf (fd, "%.0f",a); | |
754 else | |
755 fprintf (fd, "%.2f",a); | |
756 | |
757 if ( (float)((int)b) == b) | |
758 fprintf (fd, " %.0f\n",b); | |
759 else | |
760 fprintf (fd, " %.2f\n",b); | |
761 | |
762 mpsub_position = egysub->end; | |
763 for (i=0; i<egysub->lines; i++) { | |
764 fprintf (fd, "%s\n",egysub->text[i]); | |
765 } | |
766 fprintf (fd, "\n"); | |
767 } | |
768 fclose (fd); | |
769 printf ("Subtitles dumped in \'dump.mpsub\'.\n"); | |
770 } | |
771 | |
772 | |
773 | |
625 | 774 #if 0 |
258 | 775 int main(int argc, char **argv) { // for testing |
776 | |
777 int i,j; | |
778 subtitle *subs; | |
779 subtitle *egysub; | |
780 | |
781 if(argc<2){ | |
782 printf("\nUsage: subreader filename.sub\n\n"); | |
783 exit(1); | |
784 } | |
785 | |
624 | 786 subs=sub_read_file(argv[1]); |
258 | 787 if(!subs){ |
788 printf("Couldn't load file... let's write a bugreport :)\n"); | |
789 exit(1); | |
790 } | |
1761 | 791 |
792 list_sub_file(subs); | |
258 | 793 |
794 return 0; | |
795 } | |
706
8a7666a78f83
better .smi support and display two-byte characters- patch by Sunjin Yang
arpi_esp
parents:
678
diff
changeset
|
796 #endif |