2 Copyright (C) 2012 Carl Hetherington <cth@carlh.net>
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2 of the License, or
7 (at your option) any later version.
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
20 /** @file src/image.cc
21 * @brief A set of classes to describe video images.
30 #include <boost/algorithm/string.hpp>
33 #include <libavcodec/avcodec.h>
34 #include <libavformat/avformat.h>
35 #include <libswscale/swscale.h>
36 #include <libswresample/swresample.h>
37 #include <libavfilter/avfiltergraph.h>
38 #include <libavfilter/avcodec.h>
39 #include <libavfilter/buffersink.h>
40 #include <libpostproc/postprocess.h>
41 #include <libavutil/pixfmt.h>
44 #include "exceptions.h"
52 using namespace boost;
54 /** @param n Component index.
55 * @return Number of lines in the image for the given component.
58 Image::lines (int n) const
// The result depends on the pixel format of the image.
60 switch (_pixel_format) {
// NOTE(review): half the image height is returned here, presumably for vertically subsampled chroma planes; confirm against the case labels.
65 return size().height / 2;
77 /** @return Number of components, as determined by the pixel format of this image */
79 Image::components () const
// The count is selected by a switch on the pixel format.
81 switch (_pixel_format) {
94 /** Write an MD5 hash of the image's data to stdout.
95 * @param n Title to give the output.
 * @throws EncodeError if the MD5 hash context cannot be created.
98 Image::hash (string n) const
100 MHASH ht = mhash_init (MHASH_MD5);
101 if (ht == MHASH_FAILED) {
102 throw EncodeError ("could not create hash thread");
// Feed each component in turn; the whole buffer of a component (line size times line count) goes into the hash.
105 for (int i = 0; i < components(); ++i) {
106 mhash (ht, data()[i], line_size()[i] * lines(i));
// Finish the hash and collect the digest bytes.
110 mhash_deinit (ht, hash);
// Print the title, then the digest as two-digit hex bytes.
112 printf ("%s: ", n.c_str ());
113 for (int i = 0; i < int (mhash_get_block_size (MHASH_MD5)); ++i) {
114 printf ("%.2x", hash[i]);
120 /** Scale this image to a given size and convert it to RGB.
121 * @param out_size Output image size in pixels.
 * @param padding Horizontal inset, in pixels, of the scaled content within the output frame; the content width is out_size.width minus twice this value.
122 * @param scaler Scaler to use.
124 shared_ptr<RGBFrameImage>
125 Image::scale_and_convert_to_rgb (Size out_size, int padding, Scaler const * scaler) const
// The scaled content is narrower than the output frame by the padding on both sides.
129 Size content_size = out_size;
130 content_size.width -= (padding * 2);
132 shared_ptr<RGBFrameImage> rgb (new RGBFrameImage (content_size));
// One swscale context handles both the resize and the conversion to RGB24.
134 struct SwsContext* scale_context = sws_getContext (
135 size().width, size().height, pixel_format(),
136 content_size.width, content_size.height, PIX_FMT_RGB24,
137 scaler->ffmpeg_id (), 0, 0, 0
140 /* Scale and convert to RGB from whatever format it is currently in (which may be RGB) */
145 rgb->data (), rgb->line_size ()
148 /* Put the image in the right place in a black frame if we are padding; this is
149 a bit grubby and expensive, but probably inconsequential in the great
153 shared_ptr<RGBFrameImage> padded_rgb (new RGBFrameImage (out_size));
154 padded_rgb->make_black ();
156 /* XXX: we are cheating a bit here; we know the frame is RGB so we can
157 make assumptions about its composition.
// RGB24 uses three bytes per pixel, so the destination starts padding * 3 bytes into the first row.
159 uint8_t* p = padded_rgb->data()[0] + padding * 3;
160 uint8_t* q = rgb->data()[0];
// Copy one row at a time; source and destination each advance by their own line size.
161 for (int j = 0; j < rgb->lines(0); ++j) {
162 memcpy (p, q, rgb->line_size()[0]);
163 p += padded_rgb->line_size()[0];
164 q += rgb->line_size()[0];
170 sws_freeContext (scale_context);
175 /** Run an FFmpeg post-process on this image and return the processed version.
176 * @param pp Flags for the required set of post processes.
177 * @return Post-processed image.
179 shared_ptr<PostProcessImage>
180 Image::post_process (string pp) const
// The output is always allocated as YUV420P at the size of this image.
182 shared_ptr<PostProcessImage> out (new PostProcessImage (PIX_FMT_YUV420P, size ()));
// The mode is looked up by name at maximum quality; the context is created for 4:2:0 data with the MMX2 capability flag.
// NOTE(review): PP_FORMAT_420 is used regardless of _pixel_format, so presumably callers only pass YUV420P images; confirm.
184 pp_mode* mode = pp_get_mode_by_name_and_quality (pp.c_str (), PP_QUALITY_MAX);
185 pp_context* context = pp_get_context (size().width, size().height, PP_FORMAT_420 | PP_CPU_CAPS_MMX2);
// Source planes and line sizes come from this image, destination planes and line sizes from the output image.
188 (const uint8_t **) data(), line_size(),
189 out->data(), out->line_size(),
190 size().width, size().height,
191 0, 0, mode, context, 0
// NOTE(review): confirm that the mode is also released (pp_free_mode) alongside the context.
195 pp_free_context (context);
// Fill the image planes with black, according to the pixel format.
203 switch (_pixel_format) {
204 case PIX_FMT_YUV420P:
// First plane is zeroed; the second and third planes are set to 0x80 (mid-scale chroma for planar YUV).
205 memset (data()[0], 0, lines(0) * line_size()[0]);
206 memset (data()[1], 0x80, lines(1) * line_size()[1]);
207 memset (data()[2], 0x80, lines(2) * line_size()[2]);
// NOTE(review): only the first plane is zeroed on this path, presumably the single-plane RGB case; confirm against the case label.
211 memset (data()[0], 0, lines(0) * line_size()[0]);
219 /** Construct a SimpleImage of a given size and format, allocating memory
222 * @param p Pixel format.
223 * @param s Size in pixels.
225 SimpleImage::SimpleImage (PixelFormat p, Size s)
// One data pointer and one line-size entry are allocated per component, both with av_malloc.
229 _data = (uint8_t **) av_malloc (components() * sizeof (uint8_t *));
230 _line_size = (int *) av_malloc (components() * sizeof (int));
// Per-component setup follows.
232 for (int i = 0; i < components(); ++i) {
238 /** Destroy a SimpleImage */
239 SimpleImage::~SimpleImage ()
// Per-component cleanup.
241 for (int i = 0; i < components(); ++i) {
// The line-size array was obtained from av_malloc in the constructor, so it is released with av_free.
246 av_free (_line_size);
249 /** Set the size in bytes of each horizontal line of a given component,
 * and allocate the data buffer for that component.
250 * @param i Component index.
251 * @param s Size of line in bytes.
254 SimpleImage::set_line_size (int i, int s)
// The buffer holds s bytes for each line of component i.
// NOTE(review): confirm this is called once per component, or that any previous buffer is freed before being replaced.
257 _data[i] = (uint8_t *) av_malloc (s * lines (i));
// NOTE(review): presumably returns the array of per-component data pointers (_data); confirm.
261 SimpleImage::data () const
// NOTE(review): presumably returns the array of per-component line sizes (_line_size); confirm.
267 SimpleImage::line_size () const
// NOTE(review): presumably returns the size passed to the constructor; confirm.
273 SimpleImage::size () const
// Image backed by an existing AVFilterBufferRef.
// NOTE(review): presumably stores b in _buffer; confirm against the initialiser list.
279 FilterBufferImage::FilterBufferImage (PixelFormat p, AVFilterBufferRef* b)
// Releases the reference this object holds on the filter buffer.
286 FilterBufferImage::~FilterBufferImage ()
288 avfilter_unref_buffer (_buffer);
// Plane pointers are taken directly from the filter buffer.
292 FilterBufferImage::data () const
294 return _buffer->data;
// Line sizes are taken directly from the filter buffer.
298 FilterBufferImage::line_size () const
300 return _buffer->linesize;
// Dimensions are read from the video properties of the filter buffer.
304 FilterBufferImage::size () const
306 return Size (_buffer->video->w, _buffer->video->h);
309 /** XXX: this could be generalised to use any format, but I don't
310 * understand how avpicture_fill is supposed to be called with
311 * multi-planar images.
313 RGBFrameImage::RGBFrameImage (Size s)
314 : Image (PIX_FMT_RGB24)
// Allocate the frame structure first.
317 _frame = avcodec_alloc_frame ();
319 throw EncodeError ("could not allocate frame");
// A single packed buffer of width * height * 3 bytes holds the RGB24 pixels; avpicture_fill points the frame at it.
322 _data = (uint8_t *) av_malloc (size().width * size().height * 3);
323 avpicture_fill ((AVPicture *) _frame, _data, PIX_FMT_RGB24, size().width, size().height);
// Record the geometry and pixel format on the frame itself.
324 _frame->width = size().width;
325 _frame->height = size().height;
326 _frame->format = PIX_FMT_RGB24;
// NOTE(review): presumably frees the pixel buffer and the frame allocated in the constructor; confirm.
329 RGBFrameImage::~RGBFrameImage ()
// NOTE(review): presumably returns the plane pointers held by the frame; confirm.
336 RGBFrameImage::data () const
// Line sizes are those stored on the frame.
342 RGBFrameImage::line_size () const
344 return _frame->linesize;
// NOTE(review): presumably returns the size passed to the constructor; confirm.
348 RGBFrameImage::size () const
// Construct an image to receive post-processed output.
353 PostProcessImage::PostProcessImage (PixelFormat p, Size s)
// Four planes are always allocated, whatever the pixel format.
357 _data = new uint8_t*[4];
358 _line_size = new int[4];
// Every plane gets width * height bytes and a line size equal to the width.
// NOTE(review): the arrays come from new[] while each plane comes from av_malloc; the destructor should release each with the matching call.
360 for (int i = 0; i < 4; ++i) {
361 _data[i] = (uint8_t *) av_malloc (s.width * s.height);
362 _line_size[i] = s.width;
// Per-plane cleanup over the four planes allocated by the constructor.
366 PostProcessImage::~PostProcessImage ()
368 for (int i = 0; i < 4; ++i) {
// NOTE(review): presumably returns the array of plane pointers (_data); confirm.
377 PostProcessImage::data () const
// NOTE(review): presumably returns the array of line sizes (_line_size); confirm.
383 PostProcessImage::line_size () const
// NOTE(review): presumably returns the size passed to the constructor; confirm.
389 PostProcessImage::size () const