src/lib/ffmpeg_decoder.cc

   1 /*
   2     Copyright (C) 2012-2018 Carl Hetherington <cth@carlh.net>
   3
   4     This file is part of DCP-o-matic.
   5
   6     DCP-o-matic is free software; you can redistribute it and/or modify
   7     it under the terms of the GNU General Public License as published by
   8     the Free Software Foundation; either version 2 of the License, or
   9     (at your option) any later version.
  10
  11     DCP-o-matic is distributed in the hope that it will be useful,
  12     but WITHOUT ANY WARRANTY; without even the implied warranty of
  13     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14     GNU General Public License for more details.
  15
  16     You should have received a copy of the GNU General Public License
  17     along with DCP-o-matic.  If not, see <http://www.gnu.org/licenses/>.
  18
  19 */
  20
  21
   22 /** @file  src/lib/ffmpeg_decoder.cc
  23  *  @brief A decoder using FFmpeg to decode content.
  24  */
  25
  26
  27 #include "audio_buffers.h"
  28 #include "audio_content.h"
  29 #include "audio_decoder.h"
  30 #include "compose.hpp"
  31 #include "dcpomatic_log.h"
  32 #include "exceptions.h"
  33 #include "ffmpeg_audio_stream.h"
  34 #include "ffmpeg_content.h"
  35 #include "ffmpeg_decoder.h"
  36 #include "ffmpeg_subtitle_stream.h"
  37 #include "film.h"
  38 #include "filter.h"
  39 #include "frame_interval_checker.h"
  40 #include "image.h"
  41 #include "log.h"
  42 #include "raw_image_proxy.h"
  43 #include "text_content.h"
  44 #include "text_decoder.h"
  45 #include "util.h"
  46 #include "video_decoder.h"
  47 #include "video_filter_graph.h"
  48 #include <dcp/subtitle_string.h>
  49 #include <sub/ssa_reader.h>
  50 #include <sub/subtitle.h>
  51 #include <sub/collect.h>
  52 extern "C" {
  53 #include <libavcodec/avcodec.h>
  54 #include <libavformat/avformat.h>
  55 }
  56 #include <boost/algorithm/string.hpp>
  57 #include <iomanip>
  58 #include <iostream>
  59 #include <vector>
  60 #include <stdint.h>
  61
  62 #include "i18n.h"
  63
  64
  65 using std::cout;
  66 using std::dynamic_pointer_cast;
  67 using std::make_shared;
  68 using std::min;
  69 using std::shared_ptr;
  70 using std::string;
  71 using std::vector;
  72 using boost::optional;
  73 using dcp::Size;
  74 using namespace dcpomatic;
  75
  76
  77 FFmpegDecoder::FFmpegDecoder (shared_ptr<const Film> film, shared_ptr<const FFmpegContent> c, bool fast)
  78         : FFmpeg (c)
  79         , Decoder (film)
  80 {
  81         if (c->video && c->video->use()) {
  82                 video = make_shared<VideoDecoder>(this, c);
  83                 _pts_offset = pts_offset (c->ffmpeg_audio_streams(), c->first_video(), c->active_video_frame_rate(film));
  84                 /* It doesn't matter what size or pixel format this is, it just needs to be black */
  85                 _black_image = make_shared<Image>(AV_PIX_FMT_RGB24, dcp::Size (128, 128), Image::Alignment::PADDED);
  86                 _black_image->make_black ();
  87         } else {
  88                 _pts_offset = {};
  89         }
  90
  91         if (c->audio) {
  92                 audio = make_shared<AudioDecoder>(this, c->audio, fast);
  93         }
  94
  95         if (c->only_text()) {
  96                 text.push_back (make_shared<TextDecoder>(this, c->only_text()));
  97                 /* XXX: we should be calling maybe_set_position() on this TextDecoder, but we can't easily find
  98                  * the time of the first subtitle at this point.
  99                  */
 100         }
 101
 102         for (auto i: c->ffmpeg_audio_streams()) {
 103                 _next_time[i] = boost::optional<dcpomatic::ContentTime>();
 104         }
 105 }
 106
 107
 108 bool
 109 FFmpegDecoder::flush ()
 110 {
 111         /* Flush video and audio once */
 112
 113         bool did_something = false;
 114         if (video) {
 115                 if (decode_and_process_video_packet(nullptr)) {
 116                         did_something = true;
 117                 }
 118         }
 119
 120         for (auto i: ffmpeg_content()->ffmpeg_audio_streams()) {
 121                 auto context = _codec_context[i->index(_format_context)];
 122                 int r = avcodec_send_packet (context, nullptr);
 123                 if (r < 0 && r != AVERROR_EOF) {
 124                         /* EOF can happen if we've already sent a flush packet */
 125                         throw DecodeError (N_("avcodec_send_packet"), N_("FFmpegDecoder::flush"), r);
 126                 }
 127                 r = avcodec_receive_frame (context, audio_frame(i));
 128                 if (r >= 0) {
 129                         process_audio_frame (i);
 130                         did_something = true;
 131                 }
 132         }
 133
 134         if (did_something) {
 135                 /* We want to be called again */
 136                 return false;
 137         }
 138
 139         /* Make sure all streams are the same length and round up to the next video frame */
 140
 141         auto const frc = film()->active_frame_rate_change(_ffmpeg_content->position());
 142         ContentTime full_length (_ffmpeg_content->full_length(film()), frc);
 143         full_length = full_length.ceil (frc.source);
 144         if (video) {
 145                 double const vfr = _ffmpeg_content->video_frame_rate().get();
 146                 auto const f = full_length.frames_round (vfr);
 147                 auto v = video->position(film()).get_value_or(ContentTime()).frames_round(vfr) + 1;
 148                 while (v < f) {
 149                         video->emit (film(), make_shared<const RawImageProxy>(_black_image), v);
 150                         ++v;
 151                 }
 152         }
 153
 154         for (auto i: _ffmpeg_content->ffmpeg_audio_streams ()) {
 155                 auto a = audio->stream_position(film(), i);
 156                 /* Unfortunately if a is 0 that really means that we don't know the stream position since
 157                    there has been no data on it since the last seek.  In this case we'll just do nothing
 158                    here.  I'm not sure if that's the right idea.
 159                 */
 160                 if (a > ContentTime()) {
 161                         while (a < full_length) {
 162                                 auto to_do = min (full_length - a, ContentTime::from_seconds (0.1));
 163                                 auto silence = make_shared<AudioBuffers>(i->channels(), to_do.frames_ceil (i->frame_rate()));
 164                                 silence->make_silent ();
 165                                 audio->emit (film(), i, silence, a, true);
 166                                 a += to_do;
 167                         }
 168                 }
 169         }
 170
 171         if (audio) {
 172                 audio->flush ();
 173         }
 174
 175         return true;
 176 }
 177
 178
 179 bool
 180 FFmpegDecoder::pass ()
 181 {
 182         auto packet = av_packet_alloc();
 183         DCPOMATIC_ASSERT (packet);
 184
 185         int r = av_read_frame (_format_context, packet);
 186
 187         /* AVERROR_INVALIDDATA can apparently be returned sometimes even when av_read_frame
 188            has pretty-much succeeded (and hence generated data which should be processed).
 189            Hence it makes sense to continue here in that case.
 190         */
 191         if (r < 0 && r != AVERROR_INVALIDDATA) {
 192                 if (r != AVERROR_EOF) {
 193                         /* Maybe we should fail here, but for now we'll just finish off instead */
 194                         char buf[256];
 195                         av_strerror (r, buf, sizeof(buf));
 196                         LOG_ERROR (N_("error on av_read_frame (%1) (%2)"), &buf[0], r);
 197                 }
 198
 199                 av_packet_free (&packet);
 200                 return flush ();
 201         }
 202
 203         int const si = packet->stream_index;
 204         auto fc = _ffmpeg_content;
 205
 206         if (_video_stream && si == _video_stream.get() && video && !video->ignore()) {
 207                 decode_and_process_video_packet (packet);
 208         } else if (fc->subtitle_stream() && fc->subtitle_stream()->uses_index(_format_context, si) && !only_text()->ignore()) {
 209                 decode_and_process_subtitle_packet (packet);
 210         } else {
 211                 decode_and_process_audio_packet (packet);
 212         }
 213
 214         av_packet_free (&packet);
 215         return false;
 216 }
 217
 218
 219 /** @param data pointer to array of pointers to buffers.
 220  *  Only the first buffer will be used for non-planar data, otherwise there will be one per channel.
 221  */
 222 shared_ptr<AudioBuffers>
 223 FFmpegDecoder::deinterleave_audio (AVFrame* frame)
 224 {
 225         auto format = static_cast<AVSampleFormat>(frame->format);
 226
 227         /* XXX: can't we use swr_convert() to do the format conversion? */
 228
 229         int const channels = frame->channels;
 230         int const frames = frame->nb_samples;
 231         int const total_samples = frames * channels;
 232         auto audio = make_shared<AudioBuffers>(channels, frames);
 233         auto data = audio->data();
 234
 235         switch (format) {
 236         case AV_SAMPLE_FMT_U8:
 237         {
 238                 auto p = reinterpret_cast<uint8_t *> (frame->data[0]);
 239                 int sample = 0;
 240                 int channel = 0;
 241                 for (int i = 0; i < total_samples; ++i) {
 242                         data[channel][sample] = float(*p++) / (1 << 23);
 243
 244                         ++channel;
 245                         if (channel == channels) {
 246                                 channel = 0;
 247                                 ++sample;
 248                         }
 249                 }
 250         }
 251         break;
 252
 253         case AV_SAMPLE_FMT_S16:
 254         {
 255                 auto p = reinterpret_cast<int16_t *> (frame->data[0]);
 256                 int sample = 0;
 257                 int channel = 0;
 258                 for (int i = 0; i < total_samples; ++i) {
 259                         data[channel][sample] = float(*p++) / (1 << 15);
 260
 261                         ++channel;
 262                         if (channel == channels) {
 263                                 channel = 0;
 264                                 ++sample;
 265                         }
 266                 }
 267         }
 268         break;
 269
 270         case AV_SAMPLE_FMT_S16P:
 271         {
 272                 auto p = reinterpret_cast<int16_t **> (frame->data);
 273                 for (int i = 0; i < channels; ++i) {
 274                         for (int j = 0; j < frames; ++j) {
 275                                 data[i][j] = static_cast<float>(p[i][j]) / (1 << 15);
 276                         }
 277                 }
 278         }
 279         break;
 280
 281         case AV_SAMPLE_FMT_S32:
 282         {
 283                 auto p = reinterpret_cast<int32_t *> (frame->data[0]);
 284                 int sample = 0;
 285                 int channel = 0;
 286                 for (int i = 0; i < total_samples; ++i) {
 287                         data[channel][sample] = static_cast<float>(*p++) / 2147483648;
 288
 289                         ++channel;
 290                         if (channel == channels) {
 291                                 channel = 0;
 292                                 ++sample;
 293                         }
 294                 }
 295         }
 296         break;
 297
 298         case AV_SAMPLE_FMT_S32P:
 299         {
 300                 auto p = reinterpret_cast<int32_t **> (frame->data);
 301                 for (int i = 0; i < channels; ++i) {
 302                         for (int j = 0; j < frames; ++j) {
 303                                 data[i][j] = static_cast<float>(p[i][j]) / 2147483648;
 304                         }
 305                 }
 306         }
 307         break;
 308
 309         case AV_SAMPLE_FMT_FLT:
 310         {
 311                 auto p = reinterpret_cast<float*> (frame->data[0]);
 312                 int sample = 0;
 313                 int channel = 0;
 314                 for (int i = 0; i < total_samples; ++i) {
 315                         data[channel][sample] = *p++;
 316
 317                         ++channel;
 318                         if (channel == channels) {
 319                                 channel = 0;
 320                                 ++sample;
 321                         }
 322                 }
 323         }
 324         break;
 325
 326         case AV_SAMPLE_FMT_FLTP:
 327         {
 328                 auto p = reinterpret_cast<float**> (frame->data);
 329                 DCPOMATIC_ASSERT (frame->channels <= channels);
 330                 /* Sometimes there aren't as many channels in the frame as in the stream */
 331                 for (int i = 0; i < frame->channels; ++i) {
 332                         memcpy (data[i], p[i], frames * sizeof(float));
 333                 }
 334                 for (int i = frame->channels; i < channels; ++i) {
 335                         audio->make_silent (i);
 336                 }
 337         }
 338         break;
 339
 340         default:
 341                 throw DecodeError (String::compose(_("Unrecognised audio sample format (%1)"), static_cast<int>(format)));
 342         }
 343
 344         return audio;
 345 }
 346
 347
 348 AVSampleFormat
 349 FFmpegDecoder::audio_sample_format (shared_ptr<FFmpegAudioStream> stream) const
 350 {
 351         return static_cast<AVSampleFormat>(stream->stream(_format_context)->codecpar->format);
 352 }
 353
 354
 355 int
 356 FFmpegDecoder::bytes_per_audio_sample (shared_ptr<FFmpegAudioStream> stream) const
 357 {
 358         return av_get_bytes_per_sample (audio_sample_format (stream));
 359 }
 360
 361
 362 void
 363 FFmpegDecoder::seek (ContentTime time, bool accurate)
 364 {
 365         Decoder::seek (time, accurate);
 366
 367         /* If we are doing an `accurate' seek, we need to use pre-roll, as
 368            we don't really know what the seek will give us.
 369         */
 370
 371         auto pre_roll = accurate ? ContentTime::from_seconds (2) : ContentTime (0);
 372         time -= pre_roll;
 373
 374         /* XXX: it seems debatable whether PTS should be used here...
 375            http://www.mjbshaw.com/2012/04/seeking-in-ffmpeg-know-your-timestamp.html
 376         */
 377
 378         optional<int> stream;
 379
 380         if (_video_stream) {
 381                 stream = _video_stream;
 382         } else {
 383                 DCPOMATIC_ASSERT (_ffmpeg_content->audio);
 384                 auto s = dynamic_pointer_cast<FFmpegAudioStream>(_ffmpeg_content->audio->stream());
 385                 if (s) {
 386                         stream = s->index (_format_context);
 387                 }
 388         }
 389
 390         DCPOMATIC_ASSERT (stream);
 391
 392         auto u = time - _pts_offset;
 393         if (u < ContentTime ()) {
 394                 u = ContentTime ();
 395         }
 396         av_seek_frame (
 397                 _format_context,
 398                 stream.get(),
 399                 u.seconds() / av_q2d (_format_context->streams[stream.get()]->time_base),
 400                 AVSEEK_FLAG_BACKWARD
 401                 );
 402
 403         {
 404                 /* Force re-creation of filter graphs to reset them and hence to make sure
 405                    they don't have any pre-seek frames knocking about.
 406                 */
 407                 boost::mutex::scoped_lock lm (_filter_graphs_mutex);
 408                 _filter_graphs.clear ();
 409         }
 410
 411         if (video_codec_context ()) {
 412                 avcodec_flush_buffers (video_codec_context());
 413         }
 414
 415         for (auto i: ffmpeg_content()->ffmpeg_audio_streams()) {
 416                 avcodec_flush_buffers (_codec_context[i->index(_format_context)]);
 417         }
 418
 419         if (subtitle_codec_context ()) {
 420                 avcodec_flush_buffers (subtitle_codec_context ());
 421         }
 422
 423         _have_current_subtitle = false;
 424
 425         for (auto& i: _next_time) {
 426                 i.second = boost::optional<dcpomatic::ContentTime>();
 427         }
 428 }
 429
 430
 431 shared_ptr<FFmpegAudioStream>
 432 FFmpegDecoder::audio_stream_from_index (int index) const
 433 {
 434         /* XXX: inefficient */
 435         auto streams = ffmpeg_content()->ffmpeg_audio_streams();
 436         auto stream = streams.begin();
 437         while (stream != streams.end() && !(*stream)->uses_index(_format_context, index)) {
 438                 ++stream;
 439         }
 440
 441         if (stream == streams.end ()) {
 442                 return {};
 443         }
 444
 445         return *stream;
 446 }
 447
 448
 449 void
 450 FFmpegDecoder::process_audio_frame (shared_ptr<FFmpegAudioStream> stream)
 451 {
 452         auto frame = audio_frame (stream);
 453         auto data = deinterleave_audio (frame);
 454
 455         ContentTime ct;
 456         if (frame->pts == AV_NOPTS_VALUE) {
 457                 /* In some streams we see not every frame coming through with a timestamp; for those
 458                    that have AV_NOPTS_VALUE we need to work out the timestamp ourselves.  This is
 459                    particularly noticeable with TrueHD streams (see #1111).
 460                    */
 461                 if (_next_time[stream]) {
 462                         ct = *_next_time[stream];
 463                 }
 464         } else {
 465                 ct = ContentTime::from_seconds (
 466                         frame->best_effort_timestamp *
 467                         av_q2d (stream->stream(_format_context)->time_base))
 468                         + _pts_offset;
 469         }
 470
 471         _next_time[stream] = ct + ContentTime::from_frames(data->frames(), stream->frame_rate());
 472
 473         if (ct < ContentTime()) {
 474                 /* Discard audio data that comes before time 0 */
 475                 auto const remove = min (int64_t(data->frames()), (-ct).frames_ceil(double(stream->frame_rate())));
 476                 data->move (data->frames() - remove, remove, 0);
 477                 data->set_frames (data->frames() - remove);
 478                 ct += ContentTime::from_frames (remove, stream->frame_rate());
 479         }
 480
 481         if (ct < ContentTime()) {
 482                 LOG_WARNING (
 483                         "Crazy timestamp %1 for %2 samples in stream %3 (ts=%4 tb=%5, off=%6)",
 484                         to_string(ct),
 485                         data->frames(),
 486                         stream->id(),
 487                         frame->best_effort_timestamp,
 488                         av_q2d(stream->stream(_format_context)->time_base),
 489                         to_string(_pts_offset)
 490                         );
 491         }
 492
 493         /* Give this data provided there is some, and its time is sane */
 494         if (ct >= ContentTime() && data->frames() > 0) {
 495                 audio->emit (film(), stream, data, ct);
 496         }
 497 }
 498
 499
 500 void
 501 FFmpegDecoder::decode_and_process_audio_packet (AVPacket* packet)
 502 {
 503         auto stream = audio_stream_from_index (packet->stream_index);
 504         if (!stream) {
 505                 return;
 506         }
 507
 508         auto context = _codec_context[stream->index(_format_context)];
 509         auto frame = audio_frame (stream);
 510
 511         int r = avcodec_send_packet (context, packet);
 512         if (r < 0) {
 513                 LOG_WARNING("avcodec_send_packet returned %1 for an audio packet", r);
 514         }
 515         while (r >= 0) {
 516                 r = avcodec_receive_frame (context, frame);
 517                 if (r == AVERROR(EAGAIN)) {
 518                         /* More input is required */
 519                         return;
 520                 }
 521
 522                 /* We choose to be relaxed here about other errors; it seems that there may be valid
 523                  * data to decode even if an error occurred.  #352 may be related (though this was
 524                  * when we were using an old version of the FFmpeg API).
 525                  */
 526                 process_audio_frame (stream);
 527         }
 528 }
 529
 530
 531 bool
 532 FFmpegDecoder::decode_and_process_video_packet (AVPacket* packet)
 533 {
 534         DCPOMATIC_ASSERT (_video_stream);
 535
 536         auto context = video_codec_context();
 537
 538         bool pending = false;
 539         do {
 540                 int r = avcodec_send_packet (context, packet);
 541                 if (r < 0) {
 542                         LOG_WARNING("avcodec_send_packet returned %1 for a video packet", r);
 543                 }
 544
 545                 /* EAGAIN means we should call avcodec_receive_frame and then re-send the same packet */
 546                 pending = r == AVERROR(EAGAIN);
 547
 548                 while (true) {
 549                         r = avcodec_receive_frame (context, _video_frame);
 550                         if (r == AVERROR(EAGAIN) || r == AVERROR_EOF || (r < 0 && !packet)) {
 551                                 /* More input is required, no more frames are coming, or we are flushing and there was
 552                                  * some error which we just want to ignore.
 553                                  */
 554                                 return false;
 555                         } else if (r < 0) {
 556                                 throw DecodeError (N_("avcodec_receive_frame"), N_("FFmpeg::decode_and_process_video_packet"), r);
 557                         }
 558
 559                         process_video_frame ();
 560                 }
 561         } while (pending);
 562
 563         return true;
 564 }
 565
 566
 567 void
 568 FFmpegDecoder::process_video_frame ()
 569 {
 570         boost::mutex::scoped_lock lm (_filter_graphs_mutex);
 571
 572         shared_ptr<VideoFilterGraph> graph;
 573
 574         auto i = _filter_graphs.begin();
 575         while (i != _filter_graphs.end() && !(*i)->can_process(dcp::Size(_video_frame->width, _video_frame->height), (AVPixelFormat) _video_frame->format)) {
 576                 ++i;
 577         }
 578
 579         if (i == _filter_graphs.end ()) {
 580                 dcp::Fraction vfr (lrint(_ffmpeg_content->video_frame_rate().get() * 1000), 1000);
 581                 graph = make_shared<VideoFilterGraph>(dcp::Size(_video_frame->width, _video_frame->height), (AVPixelFormat) _video_frame->format, vfr);
 582                 graph->setup (_ffmpeg_content->filters ());
 583                 _filter_graphs.push_back (graph);
 584                 LOG_GENERAL (N_("New graph for %1x%2, pixel format %3"), _video_frame->width, _video_frame->height, _video_frame->format);
 585         } else {
 586                 graph = *i;
 587         }
 588
 589         auto images = graph->process (_video_frame);
 590
 591         for (auto const& i: images) {
 592
 593                 auto image = i.first;
 594
 595                 if (i.second != AV_NOPTS_VALUE) {
 596                         double const pts = i.second * av_q2d(_format_context->streams[_video_stream.get()]->time_base) + _pts_offset.seconds();
 597
 598                         video->emit (
 599                                 film(),
 600                                 make_shared<RawImageProxy>(image),
 601                                 llrint(pts * _ffmpeg_content->active_video_frame_rate(film()))
 602                                 );
 603                 } else {
 604                         LOG_WARNING_NC ("Dropping frame without PTS");
 605                 }
 606         }
 607 }
 608
 609
 610 void
 611 FFmpegDecoder::decode_and_process_subtitle_packet (AVPacket* packet)
 612 {
 613         int got_subtitle;
 614         AVSubtitle sub;
 615         if (avcodec_decode_subtitle2 (subtitle_codec_context(), &sub, &got_subtitle, packet) < 0 || !got_subtitle) {
 616                 return;
 617         }
 618
 619         auto sub_period = subtitle_period (packet, ffmpeg_content()->subtitle_stream()->stream(_format_context), sub);
 620
 621         /* Stop any current subtitle, either at the time it was supposed to stop, or now if now is sooner */
 622         if (_have_current_subtitle) {
 623                 if (_current_subtitle_to) {
 624                         only_text()->emit_stop (min(*_current_subtitle_to, sub_period.from + _pts_offset));
 625                 } else {
 626                         only_text()->emit_stop (sub_period.from + _pts_offset);
 627                 }
 628                 _have_current_subtitle = false;
 629         }
 630
 631         if (sub.num_rects <= 0) {
 632                 /* Nothing new in this subtitle */
 633                 avsubtitle_free (&sub);
 634                 return;
 635         }
 636
 637         /* Subtitle PTS (within the source, not taking into account any of the
 638            source that we may have chopped off for the DCP).
 639         */
 640         ContentTime from;
 641         from = sub_period.from + _pts_offset;
 642         if (sub_period.to) {
 643                 _current_subtitle_to = *sub_period.to + _pts_offset;
 644         } else {
 645                 _current_subtitle_to = optional<ContentTime>();
 646                 _have_current_subtitle = true;
 647         }
 648
 649         ContentBitmapText bitmap_text(from);
 650         for (unsigned int i = 0; i < sub.num_rects; ++i) {
 651                 auto const rect = sub.rects[i];
 652
 653                 switch (rect->type) {
 654                 case SUBTITLE_NONE:
 655                         break;
 656                 case SUBTITLE_BITMAP:
 657                         bitmap_text.subs.push_back(process_bitmap_subtitle(rect));
 658                         break;
 659                 case SUBTITLE_TEXT:
 660                         cout << "XXX: SUBTITLE_TEXT " << rect->text << "\n";
 661                         break;
 662                 case SUBTITLE_ASS:
 663                         process_ass_subtitle (rect->ass, from);
 664                         break;
 665                 }
 666         }
 667
 668         if (!bitmap_text.subs.empty()) {
 669                 only_text()->emit_bitmap_start(bitmap_text);
 670         }
 671
 672         if (_current_subtitle_to) {
 673                 only_text()->emit_stop (*_current_subtitle_to);
 674         }
 675
 676         avsubtitle_free (&sub);
 677 }
 678
 679
 680 BitmapText
 681 FFmpegDecoder::process_bitmap_subtitle (AVSubtitleRect const * rect)
 682 {
 683         /* Note BGRA is expressed little-endian, so the first byte in the word is B, second
 684            G, third R, fourth A.
 685         */
 686         auto image = make_shared<Image>(AV_PIX_FMT_BGRA, dcp::Size (rect->w, rect->h), Image::Alignment::PADDED);
 687
 688 #ifdef DCPOMATIC_HAVE_AVSUBTITLERECT_PICT
 689         /* Start of the first line in the subtitle */
 690         auto sub_p = rect->pict.data[0];
 691         /* sub_p looks up into a BGRA palette which is at rect->pict.data[1];
 692            (i.e. first byte B, second G, third R, fourth A)
 693         */
 694         auto const palette = rect->pict.data[1];
 695 #else
 696         /* Start of the first line in the subtitle */
 697         auto sub_p = rect->data[0];
 698         /* sub_p looks up into a BGRA palette which is at rect->data[1].
 699            (first byte B, second G, third R, fourth A)
 700         */
 701         auto const* palette = rect->data[1];
 702 #endif
 703         /* And the stream has a map of those palette colours to colours
 704            chosen by the user; created a `mapped' palette from those settings.
 705         */
 706         auto colour_map = ffmpeg_content()->subtitle_stream()->colours();
 707         vector<RGBA> mapped_palette (rect->nb_colors);
 708         for (int i = 0; i < rect->nb_colors; ++i) {
 709                 RGBA c (palette[2], palette[1], palette[0], palette[3]);
 710                 auto j = colour_map.find (c);
 711                 if (j != colour_map.end ()) {
 712                         mapped_palette[i] = j->second;
 713                 } else {
 714                         /* This colour was not found in the FFmpegSubtitleStream's colour map; probably because
 715                            it is from a project that was created before this stuff was added.  Just use the
 716                            colour straight from the original palette.
 717                         */
 718                         mapped_palette[i] = c;
 719                 }
 720                 palette += 4;
 721         }
 722
 723         /* Start of the output data */
 724         auto out_p = image->data()[0];
 725
 726         for (int y = 0; y < rect->h; ++y) {
 727                 auto sub_line_p = sub_p;
 728                 auto out_line_p = out_p;
 729                 for (int x = 0; x < rect->w; ++x) {
 730                         auto const p = mapped_palette[*sub_line_p++];
 731                         *out_line_p++ = p.b;
 732                         *out_line_p++ = p.g;
 733                         *out_line_p++ = p.r;
 734                         *out_line_p++ = p.a;
 735                 }
 736 #ifdef DCPOMATIC_HAVE_AVSUBTITLERECT_PICT
 737                 sub_p += rect->pict.linesize[0];
 738 #else
 739                 sub_p += rect->linesize[0];
 740 #endif
 741                 out_p += image->stride()[0];
 742         }
 743
 744         int target_width = subtitle_codec_context()->width;
 745         if (target_width == 0 && video_codec_context()) {
 746                 /* subtitle_codec_context()->width == 0 has been seen in the wild but I don't
 747                    know if it's supposed to mean something from FFmpeg's point of view.
 748                 */
 749                 target_width = video_codec_context()->width;
 750         }
 751         int target_height = subtitle_codec_context()->height;
 752         if (target_height == 0 && video_codec_context()) {
 753                 target_height = video_codec_context()->height;
 754         }
 755         DCPOMATIC_ASSERT (target_width);
 756         DCPOMATIC_ASSERT (target_height);
 757         dcpomatic::Rect<double> const scaled_rect (
 758                 static_cast<double>(rect->x) / target_width,
 759                 static_cast<double>(rect->y) / target_height,
 760                 static_cast<double>(rect->w) / target_width,
 761                 static_cast<double>(rect->h) / target_height
 762                 );
 763
 764         return { image, scaled_rect };
 765 }
 766
 767
 768 void
 769 FFmpegDecoder::process_ass_subtitle (string ass, ContentTime from)
 770 {
 771         /* We have no styles and no Format: line, so I'm assuming that FFmpeg
 772            produces a single format of Dialogue: lines...
 773         */
 774
 775         int commas = 0;
 776         string text;
 777         for (size_t i = 0; i < ass.length(); ++i) {
 778                 if (commas < 9 && ass[i] == ',') {
 779                         ++commas;
 780                 } else if (commas == 9) {
 781                         text += ass[i];
 782                 }
 783         }
 784
 785         if (text.empty ()) {
 786                 return;
 787         }
 788
 789         sub::RawSubtitle base;
 790         auto raw = sub::SSAReader::parse_line (
 791                 base,
 792                 text,
 793                 _ffmpeg_content->video->size().width,
 794                 _ffmpeg_content->video->size().height
 795                 );
 796
 797         for (auto const& i: sub::collect<vector<sub::Subtitle>>(raw)) {
 798                 only_text()->emit_plain_start (from, i);
 799         }
 800 }