Mercurial > mplayer.hg
annotate libass/ass.c @ 19638:a3473d990fed
Better collision detection algorithm. The idea is to keep a subtitle in place
when a lower placed one disappears, thus improving readability.
As a side effect, layers are supported now.
author | eugeni |
---|---|
date | Sat, 02 Sep 2006 19:17:32 +0000 |
parents | 4a64fecfb425 |
children | bbe600db7b83 |
rev | line source |
---|---|
18937 | 1 #include "config.h" |
2 | |
3 #include <stdio.h> | |
4 #include <stdlib.h> | |
5 #include <string.h> | |
6 #include <assert.h> | |
7 #include <errno.h> | |
8 #include <sys/types.h> | |
9 #include <sys/stat.h> | |
10 #include <unistd.h> | |
19374 | 11 #include <inttypes.h> |
18937 | 12 |
13 #ifdef HAVE_ENCA | |
14 #include "subreader.h" // for guess_buffer_cp | |
15 #endif | |
16 | |
17 #ifdef USE_ICONV | |
18 #include <iconv.h> | |
19 extern char *sub_cp; | |
20 #endif | |
19492 | 21 extern int extract_embedded_fonts; |
19495 | 22 extern char** ass_force_style_list; |
18937 | 23 |
24 #include "mp_msg.h" | |
25 #include "ass.h" | |
26 #include "ass_utils.h" | |
27 #include "libvo/sub.h" // for utf8_get_char | |
28 | |
29 char *get_path(char *); | |
30 | |
/* Per-track parser state: the script section currently being read plus the
 * buffer in which the lines of an embedded font are collected. */
19492 | 31 struct parser_priv_s { |
/* section the following lines belong to; switched by process_line() */
32 enum {PST_UNKNOWN = 0, PST_INFO, PST_STYLES, PST_EVENTS, PST_FONTS} state; | |
/* name of the font being collected (result of validate_fname()), 0 if none */
33 char* fontname; | |
/* still-encoded font data, appended line by line in process_fonts_line() */
34 char* fontdata; | |
/* number of bytes allocated for fontdata */
35 int fontdata_size; | |
/* number of bytes of fontdata already filled */
36 int fontdata_used; | |
37 }; | |
38 | |
18937 | 39 #define ASS_STYLES_ALLOC 20 |
40 #define ASS_EVENTS_ALLOC 200 | |
41 | |
42 void ass_free_track(ass_track_t* track) { | |
43 int i; | |
44 | |
19492 | 45 if (track->parser_priv) { |
46 if (track->parser_priv->fontname) | |
47 free(track->parser_priv->fontname); | |
48 if (track->parser_priv->fontdata) | |
49 free(track->parser_priv->fontdata); | |
50 free(track->parser_priv); | |
51 } | |
18937 | 52 if (track->style_format) |
53 free(track->style_format); | |
54 if (track->event_format) | |
55 free(track->event_format); | |
56 if (track->styles) { | |
19474
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
57 for (i = 0; i < track->n_styles; ++i) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
58 ass_free_style(track, i); |
18937 | 59 free(track->styles); |
60 } | |
61 if (track->events) { | |
19474
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
62 for (i = 0; i < track->n_events; ++i) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
63 ass_free_event(track, i); |
18937 | 64 free(track->events); |
65 } | |
66 } | |
67 | |
68 /// \brief Allocate a new style struct | |
69 /// \param track track | |
70 /// \return style id | |
71 int ass_alloc_style(ass_track_t* track) { | |
72 int sid; | |
73 | |
74 assert(track->n_styles <= track->max_styles); | |
75 | |
76 if (track->n_styles == track->max_styles) { | |
77 track->max_styles += ASS_STYLES_ALLOC; | |
78 track->styles = (ass_style_t*)realloc(track->styles, sizeof(ass_style_t)*track->max_styles); | |
79 } | |
80 | |
81 sid = track->n_styles++; | |
82 memset(track->styles + sid, 0, sizeof(ass_style_t)); | |
83 return sid; | |
84 } | |
85 | |
86 /// \brief Allocate a new event struct | |
87 /// \param track track | |
88 /// \return event id | |
89 int ass_alloc_event(ass_track_t* track) { | |
90 int eid; | |
91 | |
92 assert(track->n_events <= track->max_events); | |
93 | |
94 if (track->n_events == track->max_events) { | |
95 track->max_events += ASS_EVENTS_ALLOC; | |
96 track->events = (ass_event_t*)realloc(track->events, sizeof(ass_event_t)*track->max_events); | |
97 } | |
98 | |
99 eid = track->n_events++; | |
100 memset(track->events + eid, 0, sizeof(ass_event_t)); | |
101 return eid; | |
102 } | |
103 | |
19474
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
104 void ass_free_event(ass_track_t* track, int eid) { |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
105 ass_event_t* event = track->events + eid; |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
106 if (event->Name) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
107 free(event->Name); |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
108 if (event->Effect) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
109 free(event->Effect); |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
110 if (event->Text) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
111 free(event->Text); |
19638
a3473d990fed
Better collision detection algorithm. The idea is to keep a subtitle in place
eugeni
parents:
19635
diff
changeset
|
112 if (event->render_priv) |
a3473d990fed
Better collision detection algorithm. The idea is to keep a subtitle in place
eugeni
parents:
19635
diff
changeset
|
113 free(event->render_priv); |
19474
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
114 } |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
115 |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
116 void ass_free_style(ass_track_t* track, int sid) { |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
117 ass_style_t* style = track->styles + sid; |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
118 if (style->Name) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
119 free(style->Name); |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
120 if (style->FontName) |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
121 free(style->FontName); |
18937 | 122 } |
123 | |
124 static int events_compare_f(const void* a_, const void* b_) { | |
125 ass_event_t* a = (ass_event_t*)a_; | |
126 ass_event_t* b = (ass_event_t*)b_; | |
127 if (a->Start < b->Start) | |
128 return -1; | |
129 else if (a->Start > b->Start) | |
130 return 1; | |
131 else | |
132 return 0; | |
133 } | |
134 | |
135 /// \brief Sort events by start time | |
136 /// \param tid track id | |
137 static void sort_events(ass_track_t* track) { | |
138 qsort(track->events, track->n_events, sizeof(ass_event_t), events_compare_f); | |
139 } | |
140 | |
141 // ============================================================================================== | |
142 | |
/// \brief Advance *str past leading spaces and tabs
/// \param str in/out: pointer into a zero-terminated string
static void skip_spaces(char** str) {
	*str += strspn(*str, " \t");
}
149 | |
/// \brief Move *str backwards over spaces and tabs
/// \param str in/out: pointer to the last character to examine
/// \param limit lowest address that may be examined
/// On return *str points to the last non-blank character, or to limit - 1
/// if everything down to limit was blank.
static void rskip_spaces(char** str, char* limit) {
	char* cur;

	for (cur = *str; cur >= limit; --cur) {
		if (*cur != ' ' && *cur != '\t')
			break;
	}
	*str = cur;
}
156 | |
157 /** | |
158 * \brief find style by name | |
159 * \param track track | |
160 * \param name style name | |
161 * \return index in track->styles | |
162 * Returnes 0 if no styles found => expects at least 1 style. | |
163 * Parsing code always adds "Default" style in the end. | |
164 */ | |
165 static int lookup_style(ass_track_t* track, char* name) { | |
166 int i; | |
19567 | 167 if (*name == '*') ++name; // FIXME: what does '*' really mean ? |
18937 | 168 for (i=0; i<track->n_styles; ++i) { |
169 // FIXME: mb strcasecmp ? | |
170 if (strcmp(track->styles[i].Name, name) == 0) | |
171 return i; | |
172 } | |
173 i = track->default_style; | |
174 mp_msg(MSGT_GLOBAL, MSGL_WARN, "[%p] Warning: no style named '%s' found, using '%s'\n", track, name, track->styles[i].Name); | |
175 return i; // use the first style | |
176 } | |
177 | |
/// \brief Convert a colour string to its numeric value via strtocolor()
/// \param p string to parse
/// \return value stored by strtocolor(); its return status is ignored
static uint32_t string2color(char* p) {
	uint32_t color;
	char* cursor = p;

	(void)strtocolor(&cursor, &color);
	return color;
}
183 | |
184 static long long string2timecode(char* p) { | |
185 unsigned h, m, s, ms; | |
186 long long tm; | |
187 int res = sscanf(p, "%1d:%2d:%2d.%2d", &h, &m, &s, &ms); | |
188 if (res < 4) { | |
189 mp_msg(MSGT_GLOBAL, MSGL_WARN, "bad timestamp\n"); | |
190 return 0; | |
191 } | |
192 tm = ((h * 60 + m) * 60 + s) * 1000 + ms * 10; | |
193 return tm; | |
194 } | |
195 | |
/**
 * \brief converts numpad-style align to align.
 * \param val numpad-style value (1..9 presumably; other values are not rejected)
 * \return horizontal part ((val-1)%3 + 1) plus 4 times the vertical part,
 *         where the vertical part is 0 for the first row of three values,
 *         2 for the second and 1 for the third
 */
static int numpad2align(int val) {
	int row = (val - 1) / 3;        // 0, 1 or 2 for vertical alignment
	int column = (val - 1) % 3;     // horizontal alignment, zero-based
	int vertical = (row == 0) ? 0 : 3 - row;

	return column + 1 + vertical * 4;
}
207 | |
/* Field-parsing helper macros. They rely on locals of the expanding function:
 * tname (current field name), token (current value), target (struct being
 * filled) and, for STYLEVAL, track. */
/* NEXT: fetch the next comma-separated token from str into token; leaves the
 * enclosing loop with break when next_token() returns 0. */
208 #define NEXT(str,token) \ | |
209 token = next_token(&str); \ | |
210 if (!token) break; | |
211 | |
/* ANYVAL: one link of an if/else-if chain opened with "if (0) {". The leading
 * "}" closes the previous branch; the branch opened here is closed by the next
 * macro in the chain or by the final "}". If tname equals the field name
 * (case-insensitively), target->name is set to func(token). */
212 #define ANYVAL(name,func) \ | |
213 } else if (strcasecmp(tname, #name) == 0) { \ | |
214 target->name = func(token); \ | |
215 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "%s = %s\n", #name, token); | |
19495 | 216 |
/* STRVAL: same chaining as ANYVAL; frees the old string and stores a copy of token. */
217 #define STRVAL(name) \ | |
218 } else if (strcasecmp(tname, #name) == 0) { \ | |
219 if (target->name != NULL) free(target->name); \ | |
220 target->name = strdup(token); \ | |
221 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "%s = %s\n", #name, token); | |
222 | |
/* Typed shorthands: the conversion function decides how token is interpreted. */
18937 | 223 #define COLORVAL(name) ANYVAL(name,string2color) |
224 #define INTVAL(name) ANYVAL(name,atoi) | |
225 #define FPVAL(name) ANYVAL(name,atof) | |
226 #define TIMEVAL(name) ANYVAL(name,string2timecode) | |
/* STYLEVAL: same chaining as ANYVAL; stores the style index found by lookup_style(). */
227 #define STYLEVAL(name) \ | |
228 } else if (strcasecmp(tname, #name) == 0) { \ | |
229 target->name = lookup_style(track, token); \ | |
230 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "%s = %s\n", #name, token); | |
231 | |
/* ALIAS: treat field name alias as name by rewriting tname before the chain is evaluated. */
232 #define ALIAS(alias,name) \ | |
233 if (strcasecmp(tname, #alias) == 0) {tname = #name;} | |
234 | |
/// \brief Cut the next comma-separated token out of a string
/// \param str in/out: parsing position; advanced past the token and its comma
/// \return the token with surrounding spaces and tabs removed (it may be empty),
///         or 0 if only blanks are left before the end of the string
/// The input is modified: the comma and the first trailing blank are
/// overwritten with '\0'.
static char* next_token(char** str) {
	char* token = *str;
	char* end;

	// leading blanks
	while (*token == ' ' || *token == '\t')
		++token;
	if (*token == '\0') {
		*str = token;
		return 0;
	}

	// find the delimiter
	end = token;
	while (*end != '\0' && *end != ',')
		++end;
	if (*end == ',') {
		*end = '\0';
		*str = end + 1; // continue after the comma next time
	} else {
		*str = end; // end of string: the next call returns 0
	}

	// trailing blanks; an empty token leaves end == token
	while (end > token && (end[-1] == ' ' || end[-1] == '\t'))
		--end;
	*end = '\0';
	return token;
}
260 /** | |
261 * \brief Parse the tail of Dialogue line | |
262 * \param track track | |
263 * \param event parsed data goes here | |
264 * \param str string to parse, zero-terminated | |
265 * \param n_ignored number of format options to skip at the beginning | |
266 */ | |
267 static int process_event_tail(ass_track_t* track, ass_event_t* event, char* str, int n_ignored) | |
268 { | |
269 char* token; | |
270 char* tname; | |
271 char* p = str; | |
272 int i; | |
273 ass_event_t* target = event; | |
274 | |
275 char* format = strdup(track->event_format); | |
276 char* q = format; // format scanning pointer | |
277 | |
278 for (i = 0; i < n_ignored; ++i) { | |
279 NEXT(q, tname); | |
280 } | |
281 | |
282 while (1) { | |
283 NEXT(q, tname); | |
284 if (strcasecmp(tname, "Text") == 0) { | |
285 char* last; | |
286 event->Text = strdup(p); | |
19612 | 287 if (*event->Text != 0) { |
288 last = event->Text + strlen(event->Text) - 1; | |
289 if (last >= event->Text && *last == '\r') | |
290 *last = 0; | |
291 } | |
18937 | 292 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "Text = %s\n", event->Text); |
293 event->Duration -= event->Start; | |
294 free(format); | |
295 return 0; // "Text" is always the last | |
296 } | |
297 NEXT(p, token); | |
298 | |
299 ALIAS(End,Duration) // temporarily store end timecode in event->Duration | |
300 if (0) { // cool ;) | |
19635 | 301 INTVAL(Layer) |
18937 | 302 STYLEVAL(Style) |
303 STRVAL(Name) | |
304 STRVAL(Effect) | |
305 INTVAL(MarginL) | |
306 INTVAL(MarginR) | |
307 INTVAL(MarginV) | |
308 TIMEVAL(Start) | |
309 TIMEVAL(Duration) | |
310 } | |
311 } | |
312 free(format); | |
313 return 1; | |
314 } | |
315 | |
316 /** | |
19495 | 317 * \brief Parse command line style overrides (--ass-force-style option) |
318 * \param track track to apply overrides to | |
319 * The format for overrides is [StyleName.]Field=Value | |
320 */ | |
19584
586e7d259d05
Apply -ass-force-style also to tracks generated from subdata.
eugeni
parents:
19567
diff
changeset
|
321 void process_force_style(ass_track_t* track) { |
19495 | 322 char **fs, *eq, *dt, *style, *tname, *token; |
323 ass_style_t* target; | |
324 int sid; | |
325 | |
326 if (!ass_force_style_list) return; | |
327 | |
328 for (fs = ass_force_style_list; *fs; ++fs) { | |
329 eq = strchr(*fs, '='); | |
330 if (!eq) | |
331 continue; | |
332 *eq = '\0'; | |
333 token = eq + 1; | |
334 | |
335 dt = strchr(*fs, '.'); | |
336 if (dt) { | |
337 *dt = '\0'; | |
338 style = *fs; | |
339 tname = dt + 1; | |
340 } else { | |
341 style = NULL; | |
342 tname = *fs; | |
343 } | |
344 for (sid = 0; sid < track->n_styles; ++sid) { | |
345 if (style == NULL || strcasecmp(track->styles[sid].Name, style) == 0) { | |
346 target = track->styles + sid; | |
347 if (0) { | |
348 STRVAL(FontName) | |
349 COLORVAL(PrimaryColour) | |
350 COLORVAL(SecondaryColour) | |
351 COLORVAL(OutlineColour) | |
352 COLORVAL(BackColour) | |
353 INTVAL(FontSize) | |
354 INTVAL(Bold) | |
355 INTVAL(Italic) | |
356 INTVAL(Underline) | |
357 INTVAL(StrikeOut) | |
358 INTVAL(Spacing) | |
359 INTVAL(Angle) | |
360 INTVAL(BorderStyle) | |
361 INTVAL(Alignment) | |
362 INTVAL(MarginL) | |
363 INTVAL(MarginR) | |
364 INTVAL(MarginV) | |
365 INTVAL(Encoding) | |
366 FPVAL(ScaleX) | |
367 FPVAL(ScaleY) | |
368 FPVAL(Outline) | |
369 FPVAL(Shadow) | |
370 } | |
371 } | |
372 } | |
373 *eq = '='; | |
374 if (dt) *dt = '.'; | |
375 } | |
376 } | |
377 | |
378 /** | |
18937 | 379 * \brief Parse the Style line |
380 * \param track track | |
381 * \param str string to parse, zero-terminated | |
382 * Allocates a new style struct. | |
383 */ | |
384 static int process_style(ass_track_t* track, char *str) | |
385 { | |
386 | |
387 char* token; | |
388 char* tname; | |
389 char* p = str; | |
390 char* format; | |
391 char* q; // format scanning pointer | |
392 int sid; | |
393 ass_style_t* style; | |
394 ass_style_t* target; | |
395 | |
396 if (!track->style_format) { | |
397 // no style format header | |
398 // probably an ancient script version | |
399 if (track->track_type == TRACK_TYPE_SSA) | |
400 track->style_format = strdup("Name, Fontname, Fontsize, PrimaryColour, SecondaryColour," | |
401 "TertiaryColour, BackColour, Bold, Italic, BorderStyle, Outline," | |
402 "Shadow, Alignment, MarginL, MarginR, MarginV, AlphaLevel, Encoding"); | |
403 else | |
404 track->style_format = strdup("Name, Fontname, Fontsize, PrimaryColour, SecondaryColour," | |
405 "OutlineColour, BackColour, Bold, Italic, Underline, StrikeOut," | |
406 "ScaleX, ScaleY, Spacing, Angle, BorderStyle, Outline, Shadow," | |
407 "Alignment, MarginL, MarginR, MarginV, Encoding"); | |
408 } | |
409 | |
410 q = format = strdup(track->style_format); | |
411 | |
412 mp_msg(MSGT_GLOBAL, MSGL_V, "[%p] Style: %s\n", track, str); | |
413 | |
414 sid = ass_alloc_style(track); | |
415 | |
416 style = track->styles + sid; | |
417 target = style; | |
418 // fill style with some default values | |
419 style->ScaleX = 100.; | |
420 style->ScaleY = 100.; | |
421 | |
422 while (1) { | |
423 NEXT(q, tname); | |
424 NEXT(p, token); | |
425 | |
426 // ALIAS(TertiaryColour,OutlineColour) // ignore TertiaryColour; it appears only in SSA, and is overridden by BackColour | |
427 | |
428 if (0) { // cool ;) | |
429 STRVAL(Name) | |
430 if ((strcmp(target->Name, "Default")==0) || (strcmp(target->Name, "*Default")==0)) | |
431 track->default_style = sid; | |
432 STRVAL(FontName) | |
433 COLORVAL(PrimaryColour) | |
434 COLORVAL(SecondaryColour) | |
435 COLORVAL(OutlineColour) // TertiaryColor | |
436 COLORVAL(BackColour) | |
437 // SSA uses BackColour for both outline and shadow | |
438 // this will destroy SSA's TertiaryColour, but i'm not going to use it anyway | |
439 if (track->track_type == TRACK_TYPE_SSA) | |
440 target->OutlineColour = target->BackColour; | |
441 INTVAL(FontSize) | |
442 INTVAL(Bold) | |
443 INTVAL(Italic) | |
444 INTVAL(Underline) | |
445 INTVAL(StrikeOut) | |
446 INTVAL(Spacing) | |
447 INTVAL(Angle) | |
448 INTVAL(BorderStyle) | |
449 INTVAL(Alignment) | |
450 if (track->track_type == TRACK_TYPE_ASS) | |
451 target->Alignment = numpad2align(target->Alignment); | |
452 INTVAL(MarginL) | |
453 INTVAL(MarginR) | |
454 INTVAL(MarginV) | |
455 INTVAL(Encoding) | |
456 FPVAL(ScaleX) | |
457 FPVAL(ScaleY) | |
458 FPVAL(Outline) | |
459 FPVAL(Shadow) | |
460 } | |
461 } | |
462 style->ScaleX /= 100.; | |
463 style->ScaleY /= 100.; | |
464 if (!style->Name) | |
465 style->Name = strdup("Default"); | |
466 if (!style->FontName) | |
467 style->FontName = strdup("Arial"); | |
468 free(format); | |
469 return 0; | |
470 | |
471 } | |
472 | |
19492 | 473 static int process_styles_line(ass_track_t* track, char *str) |
474 { | |
475 if (!strncmp(str,"Format:", 7)) { | |
476 char* p = str + 7; | |
477 skip_spaces(&p); | |
478 track->style_format = strdup(p); | |
479 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "Style format: %s\n", track->style_format); | |
480 } else if (!strncmp(str,"Style:", 6)) { | |
481 char* p = str + 6; | |
482 skip_spaces(&p); | |
483 process_style(track, p); | |
484 } | |
485 return 0; | |
486 } | |
487 | |
488 static int process_info_line(ass_track_t* track, char *str) | |
489 { | |
490 if (!strncmp(str, "PlayResX:", 9)) { | |
491 track->PlayResX = atoi(str + 9); | |
492 } else if (!strncmp(str,"PlayResY:", 9)) { | |
493 track->PlayResY = atoi(str + 9); | |
494 } else if (!strncmp(str,"Timer:", 6)) { | |
495 track->Timer = atof(str + 6); | |
496 } else if (!strncmp(str,"WrapStyle:", 10)) { | |
497 track->WrapStyle = atoi(str + 10); | |
498 } | |
499 return 0; | |
500 } | |
501 | |
502 static int process_events_line(ass_track_t* track, char *str) | |
503 { | |
504 if (!strncmp(str, "Format:", 7)) { | |
505 char* p = str + 7; | |
506 skip_spaces(&p); | |
507 track->event_format = strdup(p); | |
508 mp_msg(MSGT_GLOBAL, MSGL_DBG2, "Event format: %s\n", track->event_format); | |
509 } else if (!strncmp(str, "Dialogue:", 9)) { | |
510 // This should never be reached for embedded subtitles. | |
511 // They have slightly different format and are parsed in ass_process_chunk, | |
512 // called directly from demuxer | |
513 int eid; | |
514 ass_event_t* event; | |
515 | |
516 str += 9; | |
517 skip_spaces(&str); | |
518 | |
519 eid = ass_alloc_event(track); | |
520 event = track->events + eid; | |
521 | |
522 process_event_tail(track, event, str, 0); | |
523 } else { | |
524 mp_msg(MSGT_GLOBAL, MSGL_V, "Not understood: %s \n", str); | |
525 } | |
526 return 0; | |
527 } | |
528 | |
// Based on code from mkvtoolnix
/// \brief Decode one group of up to four encoded font characters
/// \param c1,c2,c3,c4 encoded characters; each carries 6 bits as (value + 33).
///        Positions that are not present in the input may be passed as 0.
/// \param dst output position
/// \param cnt number of decoded bytes to store (0..3, larger values are clamped)
/// \return output position after the stored bytes
/// Each character is reduced to its 6 data bits before the group is
/// assembled, so padding characters cannot disturb the bits of real ones.
static unsigned char* decode_chars(unsigned char c1, unsigned char c2,
		unsigned char c3, unsigned char c4, unsigned char* dst, int cnt)
{
	const unsigned char in[4] = { c1, c2, c3, c4 };
	unsigned char bytes[3];
	uint32_t value = 0;
	int i;

	// unsigned arithmetic: no shifts of negative values, no borrow between fields
	for (i = 0; i < 4; ++i)
		value = (value << 6) | ((in[i] - 33u) & 0x3fu);

	bytes[0] = (value >> 16) & 0xff;
	bytes[1] = (value >> 8) & 0xff;
	bytes[2] = value & 0xff;

	for (i = 0; i < cnt && i < 3; ++i)
		*dst++ = bytes[i];
	return dst;
}
546 | |
547 static int decode_font(ass_track_t* track) | |
548 { | |
549 unsigned char* p; | |
550 unsigned char* q; | |
551 int i; | |
552 int size; // original size | |
553 int dsize; // decoded size | |
554 unsigned char* buf = 0; | |
555 | |
556 mp_msg(MSGT_GLOBAL, MSGL_V, "font: %d bytes encoded data \n", track->parser_priv->fontdata_used); | |
557 size = track->parser_priv->fontdata_used; | |
558 if (size % 4 == 1) { | |
559 mp_msg(MSGT_GLOBAL, MSGL_ERR, "bad encoded data size\n"); | |
560 goto error_decode_font; | |
561 } | |
562 buf = malloc(size / 4 * 3 + 2); | |
563 q = buf; | |
564 for (i = 0, p = (unsigned char*)track->parser_priv->fontdata; i < size / 4; i++, p+=4) { | |
565 q = decode_chars(p[0], p[1], p[2], p[3], q, 3); | |
566 } | |
567 if (size % 4 == 2) { | |
568 q = decode_chars(p[0], p[1], 0, 0, q, 1); | |
569 } else if (size % 4 == 3) { | |
570 q = decode_chars(p[0], p[1], p[2], 0, q, 2); | |
571 } | |
572 dsize = q - buf; | |
573 assert(dsize <= size / 4 * 3 + 2); | |
574 | |
575 if (extract_embedded_fonts) | |
576 ass_process_font(track->parser_priv->fontname, (char*)buf, dsize); | |
577 | |
578 error_decode_font: | |
579 if (buf) free(buf); | |
580 free(track->parser_priv->fontname); | |
581 free(track->parser_priv->fontdata); | |
582 track->parser_priv->fontname = 0; | |
583 track->parser_priv->fontdata = 0; | |
584 track->parser_priv->fontdata_size = 0; | |
585 track->parser_priv->fontdata_used = 0; | |
586 return 0; | |
587 } | |
588 | |
589 static char* validate_fname(char* name); | |
590 | |
591 static int process_fonts_line(ass_track_t* track, char *str) | |
592 { | |
593 int len; | |
594 | |
595 if (!strncmp(str, "fontname:", 9)) { | |
596 char* p = str + 9; | |
597 skip_spaces(&p); | |
598 if (track->parser_priv->fontname) { | |
599 decode_font(track); | |
600 } | |
601 track->parser_priv->fontname = validate_fname(p); | |
602 mp_msg(MSGT_GLOBAL, MSGL_V, "fontname: %s\n", track->parser_priv->fontname); | |
603 return 0; | |
604 } | |
605 | |
606 if (!track->parser_priv->fontname) { | |
607 mp_msg(MSGT_GLOBAL, MSGL_V, "Not understood: %s \n", str); | |
608 return 0; | |
609 } | |
610 | |
611 len = strlen(str); | |
612 if (len > 80) { | |
613 mp_msg(MSGT_GLOBAL, MSGL_WARN, "Font line too long: %d, %s\n", len, str); | |
614 return 0; | |
615 } | |
616 if (track->parser_priv->fontdata_used + len > track->parser_priv->fontdata_size) { | |
617 track->parser_priv->fontdata_size += 100 * 1024; | |
618 track->parser_priv->fontdata = realloc(track->parser_priv->fontdata, track->parser_priv->fontdata_size); | |
619 } | |
620 memcpy(track->parser_priv->fontdata + track->parser_priv->fontdata_used, str, len); | |
621 track->parser_priv->fontdata_used += len; | |
622 | |
623 return 0; | |
624 } | |
625 | |
18937 | 626 /** |
627 * \brief Parse a header line | |
628 * \param track track | |
629 * \param str string to parse, zero-terminated | |
630 */ | |
19492 | 631 static int process_line(ass_track_t* track, char *str) |
18937 | 632 { |
19492 | 633 if (strstr(str, "[Script Info]")) { // FIXME: strstr to skip possible BOM at the beginning of the script |
634 track->parser_priv->state = PST_INFO; | |
635 } else if (!strncmp(str, "[V4 Styles]", 11)) { | |
636 track->parser_priv->state = PST_STYLES; | |
637 track->track_type = TRACK_TYPE_SSA; | |
638 } else if (!strncmp(str, "[V4+ Styles]", 12)) { | |
639 track->parser_priv->state = PST_STYLES; | |
640 track->track_type = TRACK_TYPE_ASS; | |
641 } else if (!strncmp(str, "[Events]", 8)) { | |
642 track->parser_priv->state = PST_EVENTS; | |
643 } else if (!strncmp(str, "[Fonts]", 7)) { | |
644 track->parser_priv->state = PST_FONTS; | |
645 } else { | |
646 switch (track->parser_priv->state) { | |
647 case PST_INFO: | |
648 process_info_line(track, str); | |
649 break; | |
650 case PST_STYLES: | |
651 process_styles_line(track, str); | |
652 break; | |
653 case PST_EVENTS: | |
654 process_events_line(track, str); | |
655 break; | |
656 case PST_FONTS: | |
657 process_fonts_line(track, str); | |
658 break; | |
659 default: | |
660 break; | |
18937 | 661 } |
19492 | 662 } |
663 | |
664 // there is no explicit end-of-font marker in ssa/ass | |
665 if ((track->parser_priv->state != PST_FONTS) && (track->parser_priv->fontname)) | |
666 decode_font(track); | |
667 | |
668 return 0; | |
669 } | |
670 | |
671 static int process_text(ass_track_t* track, char* str) | |
672 { | |
673 char* p = str; | |
674 while(1) { | |
675 char* q; | |
676 for (;((*p=='\r')||(*p=='\n'));++p) {} | |
677 for (q=p; ((*q!='\0')&&(*q!='\r')&&(*q!='\n')); ++q) {}; | |
678 if (q==p) | |
679 break; | |
680 if (*q != '\0') | |
681 *(q++) = '\0'; | |
682 process_line(track, p); | |
683 if (*q == '\0') | |
684 break; | |
685 p = q; | |
18937 | 686 } |
687 return 0; | |
688 } | |
689 | |
690 /** | |
691 * \brief Process CodecPrivate section of subtitle stream | |
692 * \param track track | |
693 * \param data string to parse | |
694 * \param size length of data | |
19492 | 695 CodecPrivate section contains [Stream Info] and [V4+ Styles] ([V4 Styles] for SSA) sections |
18937 | 696 */ |
19492 | 697 void ass_process_codec_private(ass_track_t* track, char *data, int size) |
18937 | 698 { |
699 char* str = malloc(size + 1); | |
700 int sid; | |
701 | |
702 memcpy(str, data, size); | |
703 str[size] = '\0'; | |
704 | |
19492 | 705 process_text(track, str); |
18937 | 706 free(str); |
707 | |
708 // add "Default" style to the end | |
709 // will be used if track does not contain a default style (or even does not contain styles at all) | |
710 sid = ass_alloc_style(track); | |
711 track->styles[sid].Name = strdup("Default"); | |
712 track->styles[sid].FontName = strdup("Arial"); | |
713 | |
714 if (!track->event_format) { | |
715 // probably an mkv produced by ancient mkvtoolnix | |
716 // such files don't have [Events] and Format: headers | |
19492 | 717 track->parser_priv->state = PST_EVENTS; |
18937 | 718 if (track->track_type == TRACK_TYPE_SSA) |
719 track->event_format = strdup("Format: Marked, Start, End, Style, Name, MarginL, MarginR, MarginV, Effect, Text"); | |
720 else | |
721 track->event_format = strdup("Format: Layer, Start, End, Style, Actor, MarginL, MarginR, MarginV, Effect, Text"); | |
722 } | |
19495 | 723 |
724 process_force_style(track); | |
18937 | 725 } |
726 | |
727 static int check_duplicate_event(ass_track_t* track, int ReadOrder) | |
728 { | |
729 int i; | |
730 for (i = 0; i<track->n_events - 1; ++i) // ignoring last event, it is the one we are comparing with | |
731 if (track->events[i].ReadOrder == ReadOrder) | |
732 return 1; | |
733 return 0; | |
734 } | |
735 | |
736 /** | |
737 * \brief Process a chunk of subtitle stream data. In matroska, this containes exactly 1 event (or a commentary) | |
738 * \param track track | |
739 * \param data string to parse | |
740 * \param size length of data | |
741 * \param timecode starting time of the event (milliseconds) | |
742 * \param duration duration of the event (milliseconds) | |
743 */ | |
19492 | 744 void ass_process_chunk(ass_track_t* track, char *data, int size, long long timecode, long long duration) |
18937 | 745 { |
746 char* str; | |
747 int eid; | |
748 char* p; | |
749 char* token; | |
750 ass_event_t* event; | |
751 | |
752 if (!track->event_format) { | |
753 mp_msg(MSGT_GLOBAL, MSGL_WARN, "Event format header missing\n"); | |
754 return; | |
755 } | |
756 | |
757 str = malloc(size + 1); | |
758 memcpy(str, data, size); | |
759 str[size] = '\0'; | |
19378 | 760 mp_msg(MSGT_GLOBAL, MSGL_V, "event at %" PRId64 ", +%" PRId64 ": %s \n", (int64_t)timecode, (int64_t)duration, str); |
18937 | 761 |
762 eid = ass_alloc_event(track); | |
763 event = track->events + eid; | |
764 | |
765 p = str; | |
766 | |
767 do { | |
768 NEXT(p, token); | |
769 event->ReadOrder = atoi(token); | |
770 if (check_duplicate_event(track, event->ReadOrder)) | |
771 break; | |
772 | |
773 NEXT(p, token); | |
774 event->Layer = atoi(token); | |
775 | |
776 process_event_tail(track, event, p, 3); | |
777 | |
778 event->Start = timecode; | |
779 event->Duration = duration; | |
780 | |
781 free(str); | |
782 return; | |
783 // dump_events(tid); | |
784 } while (0); | |
785 // some error | |
19474
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
786 ass_free_event(track, eid); |
07209f48e527
Add public functions for removal of styles and events.
eugeni
parents:
19405
diff
changeset
|
787 track->n_events--; |
18937 | 788 free(str); |
789 } | |
790 | |
791 #ifdef USE_ICONV | |
792 /** \brief recode buffer to utf-8 | |
793 * constraint: sub_cp != 0 | |
794 * \param data pointer to text buffer | |
795 * \param size buffer size | |
796 * \return a pointer to recoded buffer, caller is responsible for freeing it | |
797 **/ | |
798 static char* sub_recode(char* data, size_t size) | |
799 { | |
800 static iconv_t icdsc = (iconv_t)(-1); | |
801 char* tocp = "UTF-8"; | |
802 char* outbuf; | |
803 assert(sub_cp); | |
804 | |
805 { | |
806 char* cp_tmp = sub_cp; | |
807 #ifdef HAVE_ENCA | |
808 char enca_lang[3], enca_fallback[100]; | |
809 if (sscanf(sub_cp, "enca:%2s:%99s", enca_lang, enca_fallback) == 2 | |
810 || sscanf(sub_cp, "ENCA:%2s:%99s", enca_lang, enca_fallback) == 2) { | |
811 cp_tmp = guess_buffer_cp((unsigned char*)data, size, enca_lang, enca_fallback); | |
812 } | |
813 #endif | |
814 if ((icdsc = iconv_open (tocp, cp_tmp)) != (iconv_t)(-1)){ | |
815 mp_msg(MSGT_SUBREADER,MSGL_V,"LIBSUB: opened iconv descriptor.\n"); | |
816 } else | |
817 mp_msg(MSGT_SUBREADER,MSGL_ERR,"LIBSUB: error opening iconv descriptor.\n"); | |
818 #ifdef HAVE_ENCA | |
819 if (cp_tmp) free(cp_tmp); | |
820 #endif | |
821 } | |
822 | |
823 { | |
824 size_t osize = size; | |
825 size_t ileft = size; | |
826 size_t oleft = size - 1; | |
827 char* ip; | |
828 char* op; | |
829 size_t rc; | |
830 | |
831 outbuf = malloc(size); | |
832 ip = data; | |
833 op = outbuf; | |
834 | |
835 while (ileft) { | |
836 rc = iconv(icdsc, &ip, &ileft, &op, &oleft); | |
837 if (rc == (size_t)(-1)) { | |
838 if (errno == E2BIG) { | |
839 int offset = op - outbuf; | |
840 outbuf = (char*)realloc(outbuf, osize + size); | |
841 op = outbuf + offset; | |
842 osize += size; | |
843 oleft += size; | |
844 } else { | |
845 mp_msg(MSGT_SUBREADER, MSGL_WARN, "LIBSUB: error recoding file.\n"); | |
846 return NULL; | |
847 } | |
848 } | |
849 } | |
850 outbuf[osize - oleft - 1] = 0; | |
851 } | |
852 | |
853 if (icdsc != (iconv_t)(-1)) { | |
854 (void)iconv_close(icdsc); | |
855 icdsc = (iconv_t)(-1); | |
856 mp_msg(MSGT_SUBREADER,MSGL_V,"LIBSUB: closed iconv descriptor.\n"); | |
857 } | |
858 | |
859 return outbuf; | |
860 } | |
861 #endif // ICONV | |
862 | |
863 /** | |
864 * \brief Read subtitles from file. | |
865 * \param fname file name | |
866 * \return newly allocated track | |
867 */ | |
868 ass_track_t* ass_read_file(char* fname) | |
869 { | |
870 int res; | |
871 long sz; | |
872 long bytes_read; | |
873 char* buf; | |
874 ass_track_t* track; | |
875 | |
876 FILE* fp = fopen(fname, "rb"); | |
877 if (!fp) { | |
878 mp_msg(MSGT_GLOBAL, MSGL_WARN, "ass_read_file(%s): fopen failed\n", fname); | |
879 return 0; | |
880 } | |
881 res = fseek(fp, 0, SEEK_END); | |
882 if (res == -1) { | |
883 mp_msg(MSGT_GLOBAL, MSGL_WARN, "ass_read_file(%s): fseek failed\n", fname); | |
884 fclose(fp); | |
885 return 0; | |
886 } | |
887 | |
888 sz = ftell(fp); | |
889 rewind(fp); | |
890 | |
891 if (sz > 10*1024*1024) { | |
892 mp_msg(MSGT_GLOBAL, MSGL_INFO, "ass_read_file(%s): Refusing to load subtitles larger than 10M\n", fname); | |
893 fclose(fp); | |
894 return 0; | |
895 } | |
896 | |
897 mp_msg(MSGT_GLOBAL, MSGL_V, "file size: %ld\n", sz); | |
898 | |
899 buf = malloc(sz + 1); | |
900 assert(buf); | |
901 bytes_read = 0; | |
902 do { | |
903 res = fread(buf + bytes_read, 1, sz - bytes_read, fp); | |
904 if (res <= 0) { | |
905 mp_msg(MSGT_GLOBAL, MSGL_INFO, "Read failed, %d: %s\n", errno, strerror(errno)); | |
906 fclose(fp); | |
907 free(buf); | |
908 return 0; | |
909 } | |
910 bytes_read += res; | |
911 } while (sz - bytes_read > 0); | |
912 buf[sz] = '\0'; | |
913 fclose(fp); | |
914 | |
915 #ifdef USE_ICONV | |
916 if (sub_cp) { | |
917 char* tmpbuf = sub_recode(buf, sz); | |
918 free(buf); | |
919 if (!tmpbuf) | |
920 return 0; | |
921 buf = tmpbuf; | |
922 } | |
923 #endif | |
924 | |
925 track = ass_new_track(); | |
926 track->name = strdup(fname); | |
927 | |
928 // process header | |
19492 | 929 process_text(track, buf); |
930 | |
931 // there is no explicit end-of-font marker in ssa/ass | |
932 if (track->parser_priv->fontname) | |
933 decode_font(track); | |
934 | |
18937 | 935 free(buf); |
936 | |
19492 | 937 if (track->track_type == TRACK_TYPE_UNKNOWN) { |
18937 | 938 ass_free_track(track); |
939 return 0; | |
940 } | |
941 | |
19495 | 942 process_force_style(track); |
943 | |
18937 | 944 mp_msg(MSGT_GLOBAL, MSGL_INFO, "LIBASS: added subtitle file: %s (%d styles, %d events)\n", fname, track->n_styles, track->n_events); |
945 | |
946 sort_events(track); | |
947 | |
948 // dump_events(forced_tid); | |
949 return track; | |
950 } | |
951 | |
/**
 * \brief Build a sanitized copy of a file name.
 * \param name input string, decoded character by character with utf8_get_char()
 * \return newly allocated string; the caller frees it
 *
 * Every decoded character above 0x7F, and each of \ / : * ? < > |,
 * is replaced by a single '_'. All other characters are copied as is.
 */
static char* validate_fname(char* name)
{
	static const char forbidden[] = "\\/:*?<>|";
	int len = strlen(name);
	char* result = malloc(len + 1);
	char* out = result;
	char* in = name;

	while (*in) {
		unsigned ch = utf8_get_char(&in);
		if (ch == 0)
			break;
		// ch is non-zero here, so strchr cannot match the table's terminator
		if (ch > 0x7F || strchr(forbidden, (int)ch))
			*out++ = '_';
		else
			*out++ = ch;
		// stop if the decoder stepped past the end of the input
		if (in - name > len)
			break;
	}
	*out = 0;
	return result;
}
987 | |
988 /** | |
989 * \brief Process embedded matroska font. Saves it to ~/.mplayer/fonts. | |
990 * \param name attachment name | |
991 * \param data binary font data | |
992 * \param data_size data size | |
993 */ | |
994 void ass_process_font(const char* name, char* data, int data_size) | |
995 { | |
996 char buf[1000]; | |
997 FILE* fp = 0; | |
998 int rc; | |
999 struct stat st; | |
1000 char* fname; | |
1001 | |
1002 char* fonts_dir = get_path("fonts"); | |
1003 rc = stat(fonts_dir, &st); | |
1004 if (rc) { | |
1005 int res; | |
1006 #ifndef __MINGW32__ | |
1007 res = mkdir(fonts_dir, 0700); | |
1008 #else | |
1009 res = mkdir(fonts_dir); | |
1010 #endif | |
1011 if (res) { | |
1012 mp_msg(MSGT_GLOBAL, MSGL_WARN, "Failed to create: %s\n", fonts_dir); | |
1013 } | |
1014 } else if (!S_ISDIR(st.st_mode)) { | |
1015 mp_msg(MSGT_GLOBAL, MSGL_WARN, "Not a directory: %s\n", fonts_dir); | |
1016 } | |
1017 | |
1018 fname = validate_fname((char*)name); | |
1019 | |
1020 snprintf(buf, 1000, "%s/%s", fonts_dir, fname); | |
1021 free(fname); | |
1022 free(fonts_dir); | |
1023 | |
1024 fp = fopen(buf, "wb"); | |
1025 if (!fp) return; | |
1026 | |
1027 fwrite(data, data_size, 1, fp); | |
1028 fclose(fp); | |
1029 } | |
1030 | |
1031 long long ass_step_sub(ass_track_t* track, long long now, int movement) { | |
1032 int i; | |
1033 | |
1034 if (movement == 0) return 0; | |
1035 if (track->n_events == 0) return 0; | |
1036 | |
1037 if (movement < 0) | |
1038 for (i = 0; (i < track->n_events) && ((long long)(track->events[i].Start + track->events[i].Duration) <= now); ++i) {} | |
1039 else | |
1040 for (i = track->n_events - 1; (i >= 0) && ((long long)(track->events[i].Start) > now); --i) {} | |
1041 | |
1042 // -1 and n_events are ok | |
1043 assert(i >= -1); assert(i <= track->n_events); | |
1044 i += movement; | |
1045 if (i < 0) i = 0; | |
1046 if (i >= track->n_events) i = track->n_events - 1; | |
1047 return ((long long)track->events[i].Start) - now; | |
1048 } | |
1049 | |
1050 ass_track_t* ass_new_track(void) { | |
1051 ass_track_t* track = calloc(1, sizeof(ass_track_t)); | |
19492 | 1052 track->parser_priv = calloc(1, sizeof(parser_priv_t)); |
18937 | 1053 return track; |
1054 } | |
1055 |