2 Copyright (C) 2016 Carl Hetherington <cth@carlh.net>
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
20 #include "ssa_reader.h"
22 #include "sub_assert.h"
23 #include "raw_convert.h"
25 #include <locked_sstream.h>
26 #include <boost/algorithm/string.hpp>
27 #include <boost/bind.hpp>
28 #include <boost/foreach.hpp>
37 using boost::optional;
38 using boost::function;
39 using namespace boost::algorithm;
/* Construct a reader from subtitle text held in memory.
   The string is wrapped in a locked_stringstream and parsed by read(), which
   is given a callback bound to get_line_stringstream and a pointer to that
   stream.  The stream is declared inside this constructor, so the bound
   callback refers to it only for the read() call made here.
*/
42 /** @param s Subtitle string encoded in UTF-8 */
43 SSAReader::SSAReader (string const & s)
45 locked_stringstream str (s);
46 this->read (boost::bind (&get_line_stringstream, &str));
/* Construct a reader from a C stdio stream.
   Parsing is done by read(), which is given a callback bound to get_line_file
   and `f`.  Nothing visible here checks `f` for null or closes it --
   presumably the caller owns the handle; confirm.
*/
49 /** @param f Subtitle file encoded in UTF-8 */
50 SSAReader::SSAReader (FILE* f)
52 this->read (boost::bind (&get_line_file, f));
60 , primary_colour (255, 255, 255)
64 , horizontal_reference (HORIZONTAL_CENTRE_OF_SCREEN)
65 , vertical_reference (BOTTOM_OF_SCREEN)
/* Build a Style from a pair of comma-separated lines.
   @param format_line Comma-separated list of field names (keys).
   @param style_line Comma-separated list of values, one per key.
   Both lists must be non-empty and of equal length (checked with SUB_ASSERT).
   Each value is interpreted according to the key at the same index; keys not
   tested below are not acted on by the visible code.
*/
69 Style (string format_line, string style_line)
/* Defaults used when the corresponding key is absent: white primary colour,
   horizontally centred, referenced to the bottom of the screen.
*/
71 , primary_colour (255, 255, 255)
75 , horizontal_reference (HORIZONTAL_CENTRE_OF_SCREEN)
76 , vertical_reference (BOTTOM_OF_SCREEN)
/* Split both lines on every ','; no quoting or escaping is recognised */
80 split (keys, format_line, boost::is_any_of (","));
82 split (style, style_line, boost::is_any_of (","));
84 SUB_ASSERT (!keys.empty());
85 SUB_ASSERT (!style.empty());
86 SUB_ASSERT (keys.size() == style.size());
88 for (size_t i = 0; i < style.size(); ++i) {
91 if (keys[i] == "Name") {
93 } else if (keys[i] == "Fontname") {
95 } else if (keys[i] == "Fontsize") {
96 font_size = raw_convert<int> (style[i]);
97 } else if (keys[i] == "PrimaryColour") {
/* Colours are converted as plain ints and then unpacked by colour().
   NOTE(review): SSA/ASS files often write colours as &H... hexadecimal;
   whether raw_convert<int> accepts that form is not visible here -- confirm.
*/
98 primary_colour = colour (raw_convert<int> (style[i]));
99 } else if (keys[i] == "BackColour") {
100 back_colour = colour (raw_convert<int> (style[i]));
101 } else if (keys[i] == "Bold") {
/* Bold, Italic and Underline are true only when the field is exactly "-1" */
102 bold = style[i] == "-1";
103 } else if (keys[i] == "Italic") {
104 italic = style[i] == "-1";
105 } else if (keys[i] == "Underline") {
106 underline = style[i] == "-1";
107 } else if (keys[i] == "BorderStyle") {
/* Only the value "1" is given special treatment */
108 if (style[i] == "1") {
111 } else if (keys[i] == "Alignment") {
112 /* These values from libass' source code */
/* Horizontal reference is selected from (alignment - 1) modulo 3 */
113 switch ((raw_convert<int> (style[i]) - 1) % 3) {
115 horizontal_reference = LEFT_OF_SCREEN;
118 horizontal_reference = HORIZONTAL_CENTRE_OF_SCREEN;
121 horizontal_reference = RIGHT_OF_SCREEN;
/* Vertical reference is selected from the bits worth 4 and 8 (mask 12).
   NOTE(review): this bit-mask decode looks like the legacy SSA alignment
   encoding.  If this constructor is also used for V4+ styles, whose alignment
   is presumably the 1-9 keypad layout, then values 4-6 and 8-9 would not
   land on the centre/top rows under this mask -- confirm.
*/
124 switch (raw_convert<int> (style[i]) & 12) {
126 vertical_reference = TOP_OF_SCREEN;
129 vertical_reference = VERTICAL_CENTRE_OF_SCREEN;
132 vertical_reference = BOTTOM_OF_SCREEN;
135 } else if (keys[i] == "MarginV") {
/* Stored as given; presumably in script pixels -- confirm against the caller */
136 vertical_margin = raw_convert<int> (style[i]);
/* Font name; optional, so it may be unset (presumably when the style has no
   "Fontname" field -- confirm)
*/
142 optional<string> font_name;
/* Text colour; defaults to (255, 255, 255) and is replaced by "PrimaryColour" */
144 Colour primary_colour;
145 /** outline colour */
/* Set from the "BackColour" field; unset if that field is absent */
146 optional<Colour> back_colour;
/* Optional text effect; may be unset */
150 optional<Effect> effect;
/* Screen references; default to horizontal centre / bottom of screen and are
   replaced when an "Alignment" field is present
*/
151 HorizontalReference horizontal_reference;
152 VerticalReference vertical_reference;
/* Unpack a packed integer colour into three components, each scaled to the
   range 0 to 1 by dividing by 255.0.
   @param c Packed colour; bits 0-7 give the first component, bits 8-15 the
   second and bits 16-23 the third.  Bits above 23 are ignored.
   NOTE(review): this looks like SSA's blue-green-red packing being handed to
   Colour in red, green, blue order -- confirm against Colour's constructor.
*/
156 Colour colour (int c) const
159 ((c & 0x0000ff) >> 0) / 255.0,
160 ((c & 0x00ff00) >> 8) / 255.0,
161 ((c & 0xff0000) >> 16) / 255.0
/* Convert a timestamp string into a Time.
   @param t Timestamp; it is split on every ':' and '.' and must yield exactly
   four fields (checked with SUB_ASSERT).
   @return Result of Time::from_hms given the four fields as ints, in order,
   with the last one multiplied by 10.
   NOTE(review): the factor of 10 suggests the last field is hundredths of a
   second being turned into milliseconds -- confirm against Time::from_hms.  A
   fraction written with a different number of digits would then be mis-scaled.
*/
167 SSAReader::parse_time (string t) const
170 split (bits, t, is_any_of (":."));
171 SUB_ASSERT (bits.size() == 4);
172 return Time::from_hms (
173 raw_convert<int> (bits[0]),
174 raw_convert<int> (bits[1]),
175 raw_convert<int> (bits[2]),
176 raw_convert<int> (bits[3]) * 10
/* Split the text of one subtitle event into a list of RawSubtitles.
   A working copy of `base` is made; if it has no vertical reference it gets
   BOTTOM_OF_SCREEN, if it has no proportional vertical position it gets 0, and
   if it has no point size it gets 72.  The text is then walked one character
   at a time.  Each time a style tag or a line break is reached, any text
   gathered so far is appended to the result as its own RawSubtitle.
   play_res_x and play_res_y are used only to scale the coordinates of a
   "\pos" tag.
   NOTE(review): the existing @return text below mentions TOP_OF_SUBTITLE, but
   the code defaults the reference to BOTTOM_OF_SCREEN and the tags can set
   other references; the @return wording looks out of date -- confirm.
*/
180 /** @param base RawSubtitle filled in with any required common values.
181 * @param line SSA line string (i.e. just the subtitle, possibly with embedded stuff)
182 * @return List of RawSubtitles to represent line with vertical reference TOP_OF_SUBTITLE.
185 SSAReader::parse_line (RawSubtitle base, string line, int play_res_x, int play_res_y)
193 list<RawSubtitle> subs;
194 RawSubtitle current = base;
197 if (!current.vertical_position.reference) {
198 current.vertical_position.reference = BOTTOM_OF_SCREEN;
201 if (!current.vertical_position.proportional) {
202 current.vertical_position.proportional = 0;
205 /* We must have a font size, as there could be a margin specified
206 in pixels and in that case we must know how big the subtitle
207 lines are to work out the position on screen.
209 if (!current.font_size.points()) {
210 current.font_size.set_points (72);
213 /* Count the number of line breaks */
/* NOTE(review): line.length() - 1 is computed in size_t.  For an empty `line`
   it wraps round to the largest size_t value, so the loop is entered and
   line[i] and line[i+1] are indexed out of range.  Writing the condition as
   i + 1 < line.length() would avoid the wrap.
*/
215 for (size_t i = 0; i < line.length() - 1; ++i) {
216 if (line[i] == '\\' && (line[i+1] == 'n' || line[i+1] == 'N')) {
221 /* Imagine that the screen is 792 points (i.e. 11 inches) high (as with DCP) */
222 double const line_size = current.font_size.proportional(792) * 1.2;
224 /* Tweak vertical_position accordingly */
225 switch (current.vertical_position.reference.get()) {
227 case TOP_OF_SUBTITLE:
230 case VERTICAL_CENTRE_OF_SCREEN:
/* Subtract half the height of the whole block of (line_breaks + 1) lines */
231 current.vertical_position.proportional = current.vertical_position.proportional.get() - ((line_breaks + 1) * line_size) / 2;
233 case BOTTOM_OF_SCREEN:
/* Start line_breaks lines further from the reference; each break handled in
   the loop below subtracts one line_size again, so the last line ends up at
   the offset that was originally requested.
*/
234 current.vertical_position.proportional = current.vertical_position.proportional.get() + line_breaks * line_size;
/* Walk the text one character at a time */
238 for (size_t i = 0; i < line.length(); ++i) {
239 char const c = line[i];
244 } else if (c == '\\') {
/* Carriage returns and newlines in the text are skipped */
246 } else if (c != '\r' && c != '\n') {
/* A '}' or a backslash ends the tag held in `style`; text gathered so far is
   pushed to the result before the tag is applied.
*/
251 if (c == '}' || c == '\\') {
252 if (!current.text.empty ()) {
253 subs.push_back (current);
256 if (style == "\\i1") {
257 current.italic = true;
258 } else if (style == "\\i0" || style == "\\i") {
259 current.italic = false;
260 } else if (style == "\\b1") {
262 } else if (style == "\\b0") {
263 current.bold = false;
264 } else if (style == "\\u1") {
265 current.underline = true;
266 } else if (style == "\\u0") {
267 current.underline = false;
/* The \an1 to \an9 tags change only the vertical reference here: 1-3 bottom,
   4-6 centre, 7-9 top.  The horizontal reference is left as it was.
*/
268 } else if (style == "\\an1" || style == "\\an2" || style == "\\an3") {
269 current.vertical_position.reference = sub::BOTTOM_OF_SCREEN;
270 } else if (style == "\\an4" || style == "\\an5" || style == "\\an6") {
271 current.vertical_position.reference = sub::VERTICAL_CENTRE_OF_SCREEN;
272 } else if (style == "\\an7" || style == "\\an8" || style == "\\an9") {
273 current.vertical_position.reference = sub::TOP_OF_SCREEN;
274 } else if (boost::starts_with(style, "\\pos")) {
/* The tag is split on '(' and ',' and must give exactly three parts: the tag
   name, x and y.  The position becomes relative to the left and top of the
   screen, with x and y divided by the script resolution.
   NOTE(review): ')' is not a separator, so the last part presumably still ends
   with ')' when converted; whether raw_convert<float> tolerates that is not
   visible here -- confirm.
*/
276 boost::algorithm::split (bits, style, boost::is_any_of("(,"));
277 SUB_ASSERT (bits.size() == 3);
278 current.horizontal_position.reference = sub::LEFT_OF_SCREEN;
279 current.horizontal_position.proportional = raw_convert<float>(bits[1]) / play_res_x;
280 current.vertical_position.reference = sub::TOP_OF_SCREEN;
281 current.vertical_position.proportional = raw_convert<float>(bits[2]) / play_res_y;
/* An 'n' or 'N' here is treated as a line break: text gathered so far is
   pushed to the result and the vertical position moves by one line.
*/
294 if (c == 'n' || c == 'N') {
295 if (!current.text.empty ()) {
296 subs.push_back (current);
299 /* Move down one line (1.2 times the font size) */
300 if (current.vertical_position.reference.get() == BOTTOM_OF_SCREEN) {
301 current.vertical_position.proportional = current.vertical_position.proportional.get() - line_size;
303 current.vertical_position.proportional = current.vertical_position.proportional.get() + line_size;
/* Push whatever text remains after the last character */
311 if (!current.text.empty ()) {
312 subs.push_back (current);
319 SSAReader::read (function<optional<string> ()> get_line)
327 int play_res_x = 288;
328 int play_res_y = 288;
329 map<string, Style> styles;
330 string style_format_line;
331 vector<string> event_format;
334 optional<string> line = get_line ();
340 remove_unicode_bom (line);
342 if (starts_with (*line, ";") || line->empty ()) {
346 if (starts_with (*line, "[")) {
347 /* Section heading */
348 if (line.get() == "[Script Info]") {
350 } else if (line.get() == "[V4 Styles]" || line.get() == "[V4+ Styles]") {
352 } else if (line.get() == "[Events]") {
358 size_t const colon = line->find (":");
359 SUB_ASSERT (colon != string::npos);
360 string const type = line->substr (0, colon);
361 string body = line->substr (colon + 1);
366 if (type == "PlayResX") {
367 play_res_x = raw_convert<int> (body);
368 } else if (type == "PlayResY") {
369 play_res_y = raw_convert<int> (body);
373 if (type == "Format") {
374 style_format_line = body;
375 } else if (type == "Style") {
376 SUB_ASSERT (!style_format_line.empty ());
377 Style s (style_format_line, body);
382 if (type == "Format") {
383 split (event_format, body, is_any_of (","));
384 BOOST_FOREACH (string& i, event_format) {
387 } else if (type == "Dialogue") {
388 SUB_ASSERT (!event_format.empty ());
389 vector<string> event;
390 split (event, body, is_any_of (","));
392 /* There may be commas in the subtitle part; reassemble any extra parts
393 from when we just split it.
395 while (event.size() > event_format.size()) {
396 string const ex = event.back ();
398 event.back() += "," + ex;
401 SUB_ASSERT (!event.empty());
402 SUB_ASSERT (event_format.size() == event.size());
406 for (size_t i = 0; i < event.size(); ++i) {
408 if (event_format[i] == "Start") {
409 sub.from = parse_time (event[i]);
410 } else if (event_format[i] == "End") {
411 sub.to = parse_time (event[i]);
412 } else if (event_format[i] == "Style") {
413 /* libass trims leading '*'s from style names, commenting that
414 "they seem to mean literally nothing". Go figure...
416 trim_left_if (event[i], boost::is_any_of ("*"));
417 SUB_ASSERT (styles.find(event[i]) != styles.end());
418 Style style = styles[event[i]];
419 sub.font = style.font_name;
420 sub.font_size = FontSize::from_points (style.font_size);
421 sub.colour = style.primary_colour;
422 sub.effect_colour = style.back_colour;
423 sub.bold = style.bold;
424 sub.italic = style.italic;
425 sub.underline = style.underline;
426 sub.effect = style.effect;
427 sub.horizontal_position.reference = style.horizontal_reference;
428 sub.vertical_position.reference = style.vertical_reference;
429 sub.vertical_position.proportional = float(style.vertical_margin) / play_res_y;
430 } else if (event_format[i] == "MarginV") {
431 sub.vertical_position.proportional = raw_convert<float>(event[i]) / play_res_y;
432 } else if (event_format[i] == "Text") {
433 BOOST_FOREACH (sub::RawSubtitle j, parse_line (sub, event[i], play_res_x, play_res_y)) {