2 * The copyright in this software is being made available under the 2-clauses
3 * BSD License, included below. This software may be subject to other third
4 * party and contributor rights, including patent rights, and no such rights
5 * are granted under this license.
7 * Copyright (c) 2002-2014, Universite catholique de Louvain (UCL), Belgium
8 * Copyright (c) 2002-2014, Professor Benoit Macq
9 * Copyright (c) 2001-2003, David Janssens
10 * Copyright (c) 2002-2003, Yannick Verschueren
11 * Copyright (c) 2003-2007, Francois-Olivier Devaux
12 * Copyright (c) 2003-2014, Antonin Descampe
13 * Copyright (c) 2005, Herve Drolon, FreeImage Team
14 * All rights reserved.
16 * Redistribution and use in source and binary forms, with or without
17 * modification, are permitted provided that the following conditions
19 * 1. Redistributions of source code must retain the above copyright
20 * notice, this list of conditions and the following disclaimer.
21 * 2. Redistributions in binary form must reproduce the above copyright
22 * notice, this list of conditions and the following disclaimer in the
23 * documentation and/or other materials provided with the distribution.
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS `AS IS'
26 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
29 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
32 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
33 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
35 * POSSIBILITY OF SUCH DAMAGE.
39 #include <xmmintrin.h>
42 #include "opj_includes.h"
45 /* This table contains the norms of the basis functions of the reversible MCT.
   It holds three values; mct_getnorm() returns the entry selected by the
   component number it is given. */
47 static const double mct_norms[3] = { 1.732, .8292, .8292 };
50 /* This table contains the norms of the basis functions of the irreversible MCT.
   It holds three values; mct_getnorm_real() returns the entry selected by the
   component number it is given. */
52 static const double mct_norms_real[3] = { 1.732, 1.805, 1.573 };
55 /* Forward reversible MCT.
   NOTE(review): the function header and the statements that produce r, g and
   b are outside the visible source; confirm them before relying on this
   description. */
/* Runs once for each of the n entries. */
64 for(i = 0; i < n; ++i) {
/* y = (r + 2*g + b) shifted right by two bits, which equals a divide by 4
   with the remainder dropped when the sum is non-negative. */
68 int y = (r + (g * 2) + b) >> 2;
78 /* Inverse reversible MCT.
   NOTE(review): the function header, the statements that produce y, u and v,
   and the reconstruction of the other outputs are outside the visible source;
   confirm them before relying on this description. */
/* Runs once for each of the n entries. */
87 for (i = 0; i < n; ++i) {
/* g is y minus the sum of u and v shifted right by two bits. */
91 int g = y - ((u + v) >> 2);
101 /* Get norm of basis function of reversible MCT.
   Returns mct_norms[compno]. mct_norms has three entries and compno is used
   directly as the index; no range check is visible here, so callers must pass
   0, 1 or 2. */
103 double mct_getnorm(int compno) {
104 return mct_norms[compno];
108 /* Forward irreversible MCT.
   Computes y, u and v as weighted sums of r, g and b, with every product
   formed by fix_mul().
   NOTE(review): the parameter list, the statements that produce r, g and b,
   and the statements that store y, u and v are outside the visible source. */
110 void mct_encode_real(
/* Runs once for each of the n entries. */
117 for(i = 0; i < n; ++i) {
/* The y weights add up to 8192 (2449 + 4809 + 934) and the u and v weights
   each add up to 0, so the weights look like real coefficients scaled by
   2^13 -- TODO confirm against the fixed-point format fix_mul() expects. */
121 int y = fix_mul(r, 2449) + fix_mul(g, 4809) + fix_mul(b, 934);
122 int u = -fix_mul(r, 1382) - fix_mul(g, 2714) + fix_mul(b, 4096);
123 int v = fix_mul(r, 4096) - fix_mul(g, 3430) - fix_mul(b, 666);
131 /* Inverse irreversible MCT.
   Two code paths are visible: one built on SSE __m128 intrinsics and one
   scalar float loop. Both apply the same constants and formulas:
     r = y + 1.402 * v
     g = y - 0.34413 * u - 0.71414 * v
     b = y + 1.772 * u
   NOTE(review): the parameter list, any preprocessor guard around the SSE
   path, the pointer increments, and the scalar loads and stores are outside
   the visible source; confirm them before relying on this description. */
133 void mct_decode_real(
/* Broadcast each conversion constant into every lane of a vector so it can
   be applied to four floats at once. */
141 __m128 vrv, vgu, vgv, vbu;
142 vrv = _mm_set1_ps(1.402f);
143 vgu = _mm_set1_ps(0.34413f);
144 vgv = _mm_set1_ps(0.71414f);
145 vbu = _mm_set1_ps(1.772f);
/* n >> 3 iterations; each iteration contains two identical
   load/compute/store groups of four floats.
   NOTE(review): presumably c0, c1 and c2 are advanced by four elements after
   each group, making eight entries per iteration -- the increments are not
   visible here; confirm. */
146 for (i = 0; i < (n >> 3); ++i) {
/* First group. _mm_load_ps and _mm_store_ps are the aligned variants, so c0,
   c1 and c2 must be 16-byte aligned at this point. */
150 vy = _mm_load_ps(c0);
151 vu = _mm_load_ps(c1);
152 vv = _mm_load_ps(c2);
153 vr = _mm_add_ps(vy, _mm_mul_ps(vv, vrv));
154 vg = _mm_sub_ps(_mm_sub_ps(vy, _mm_mul_ps(vu, vgu)), _mm_mul_ps(vv, vgv));
155 vb = _mm_add_ps(vy, _mm_mul_ps(vu, vbu));
/* Results overwrite the inputs in place: r goes to c0, g to c1, b to c2. */
156 _mm_store_ps(c0, vr);
157 _mm_store_ps(c1, vg);
158 _mm_store_ps(c2, vb);
/* Second group: same computation as the first. */
163 vy = _mm_load_ps(c0);
164 vu = _mm_load_ps(c1);
165 vv = _mm_load_ps(c2);
166 vr = _mm_add_ps(vy, _mm_mul_ps(vv, vrv));
167 vg = _mm_sub_ps(_mm_sub_ps(vy, _mm_mul_ps(vu, vgu)), _mm_mul_ps(vv, vgv));
168 vb = _mm_add_ps(vy, _mm_mul_ps(vu, vbu));
169 _mm_store_ps(c0, vr);
170 _mm_store_ps(c1, vg);
171 _mm_store_ps(c2, vb);
/* Scalar loop applying the same formulas one entry at a time.
   NOTE(review): whether n has been reduced to the entries left over from the
   vector loop before this point is not visible here; confirm. */
178 for(i = 0; i < n; ++i) {
182 float r = y + (v * 1.402f);
183 float g = y - (u * 0.34413f) - (v * (0.71414f));
184 float b = y + (u * 1.772f);
192 /* Get norm of basis function of irreversible MCT.
   Returns mct_norms_real[compno]. mct_norms_real has three entries and compno
   is used directly as the index; no range check is visible here, so callers
   must pass 0, 1 or 2. */
194 double mct_getnorm_real(int compno) {
195 return mct_norms_real[compno];