OpenJPH
Open-source implementation of JPEG2000 Part-15
Loading...
Searching...
No Matches
ojph_colour.cpp
Go to the documentation of this file.
1//***************************************************************************/
2// This software is released under the 2-Clause BSD license, included
3// below.
4//
5// Copyright (c) 2019, Aous Naman
6// Copyright (c) 2019, Kakadu Software Pty Ltd, Australia
7// Copyright (c) 2019, The University of New South Wales, Australia
8//
9// Redistribution and use in source and binary forms, with or without
10// modification, are permitted provided that the following conditions are
11// met:
12//
13// 1. Redistributions of source code must retain the above copyright
14// notice, this list of conditions and the following disclaimer.
15//
16// 2. Redistributions in binary form must reproduce the above copyright
17// notice, this list of conditions and the following disclaimer in the
18// documentation and/or other materials provided with the distribution.
19//
20// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
21// IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
22// TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
23// PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
24// HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
25// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
26// TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
27// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
28// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
29// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
30// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31//***************************************************************************/
32// This file is part of the OpenJPH software implementation.
33// File: ojph_colour.cpp
34// Author: Aous Naman
35// Date: 28 August 2019
36//***************************************************************************/
37
38#include <cmath>
39
40#include "ojph_defs.h"
41#include "ojph_arch.h"
42#include "ojph_mem.h"
43#include "ojph_colour.h"
44#include "ojph_colour_local.h"
45
46namespace ojph {
47
48 // defined elsewhere
49 class line_buf;
50
51 namespace local {
52
55 (const line_buf *src_line, const ui32 src_line_offset,
56 line_buf *dst_line, const ui32 dst_line_offset,
57 si64 shift, ui32 width) = NULL;
58
61 (const line_buf *src_line, const ui32 src_line_offset,
62 line_buf *dst_line, const ui32 dst_line_offset,
63 si64 shift, ui32 width) = NULL;
64
67 (const si32 *sp, float *dp, float mul, ui32 width) = NULL;
68
71 (const si32 *sp, float *dp, float mul, ui32 width) = NULL;
72
75 (const float *sp, si32 *dp, float mul, ui32 width) = NULL;
76
79 (const float *sp, si32 *dp, float mul, ui32 width) = NULL;
80
83 (const line_buf* r, const line_buf* g, const line_buf* b,
84 line_buf* y, line_buf* cb, line_buf* cr, ui32 repeat) = NULL;
85
88 (const line_buf* r, const line_buf* g, const line_buf* b,
89 line_buf* y, line_buf* cb, line_buf* cr, ui32 repeat) = NULL;
90
93 (const float *r, const float *g, const float *b,
94 float *y, float *cb, float *cr, ui32 repeat) = NULL;
95
98 (const float *y, const float *cb, const float *cr,
99 float *r, float *g, float *b, ui32 repeat) = NULL;
100
103
106 {
108 return;
109
110#if !defined(OJPH_ENABLE_WASM_SIMD) || !defined(OJPH_EMSCRIPTEN)
111
122
123 #ifndef OJPH_DISABLE_SIMD
124
125 #if (defined(OJPH_ARCH_X86_64) || defined(OJPH_ARCH_I386))
126
127 #ifndef OJPH_DISABLE_SSE
129 {
136 }
137 #endif // !OJPH_DISABLE_SSE
138
139 #ifndef OJPH_DISABLE_SSE2
141 {
148 }
149 #endif // !OJPH_DISABLE_SSE2
150
151 #ifndef OJPH_DISABLE_AVX
153 {
160 }
161 #endif // !OJPH_DISABLE_AVX
162
163 #ifndef OJPH_DISABLE_AVX2
165 {
170 }
171 #endif // !OJPH_DISABLE_AVX2
172
173 #elif defined(OJPH_ARCH_ARM)
174
175 #endif // !(defined(OJPH_ARCH_X86_64) || defined(OJPH_ARCH_I386))
176
177 #endif // !OJPH_DISABLE_SIMD
178
179#else // OJPH_ENABLE_WASM_SIMD
180
191
192#endif // !OJPH_ENABLE_WASM_SIMD
193
195 }
196
198 const float CT_CNST::ALPHA_RF = 0.299f;
199 const float CT_CNST::ALPHA_GF = 0.587f;
200 const float CT_CNST::ALPHA_BF = 0.114f;
201 const float CT_CNST::BETA_CbF = float(0.5/(1-double(CT_CNST::ALPHA_BF)));
202 const float CT_CNST::BETA_CrF = float(0.5/(1-double(CT_CNST::ALPHA_RF)));
203 const float CT_CNST::GAMMA_CB2G =
204 float(2.0*double(ALPHA_BF)*(1.0-double(ALPHA_BF))/double(ALPHA_GF));
205 const float CT_CNST::GAMMA_CR2G =
206 float(2.0*double(ALPHA_RF)*(1.0-double(ALPHA_RF))/double(ALPHA_GF));
207 const float CT_CNST::GAMMA_CB2B = float(2.0 * (1.0 - double(ALPHA_BF)));
208 const float CT_CNST::GAMMA_CR2R = float(2.0 * (1.0 - double(ALPHA_RF)));
209
211
212#if !defined(OJPH_ENABLE_WASM_SIMD) || !defined(OJPH_EMSCRIPTEN)
213
216 const line_buf *src_line, const ui32 src_line_offset,
217 line_buf *dst_line, const ui32 dst_line_offset,
218 si64 shift, ui32 width)
219 {
220 if (src_line->flags & line_buf::LFT_32BIT)
221 {
222 if (dst_line->flags & line_buf::LFT_32BIT)
223 {
224 const si32 *sp = src_line->i32 + src_line_offset;
225 si32 *dp = dst_line->i32 + dst_line_offset;
226 si32 s = (si32)shift;
227 for (ui32 i = width; i > 0; --i)
228 *dp++ = *sp++ + s;
229 }
230 else
231 {
232 const si32 *sp = src_line->i32 + src_line_offset;
233 si64 *dp = dst_line->i64 + dst_line_offset;
234 for (ui32 i = width; i > 0; --i)
235 *dp++ = *sp++ + shift;
236 }
237 }
238 else
239 {
240 assert(src_line->flags | line_buf::LFT_64BIT);
241 assert(dst_line->flags | line_buf::LFT_32BIT);
242 const si64 *sp = src_line->i64 + src_line_offset;
243 si32 *dp = dst_line->i32 + dst_line_offset;
244 for (ui32 i = width; i > 0; --i)
245 *dp++ = (si32)(*sp++ + shift);
246 }
247 }
248
251 const line_buf *src_line, const ui32 src_line_offset,
252 line_buf *dst_line, const ui32 dst_line_offset,
253 si64 shift, ui32 width)
254 {
255 if (src_line->flags & line_buf::LFT_32BIT)
256 {
257 if (dst_line->flags & line_buf::LFT_32BIT)
258 {
259 const si32 *sp = src_line->i32 + src_line_offset;
260 si32 *dp = dst_line->i32 + dst_line_offset;
261 si32 s = (si32)shift;
262 for (ui32 i = width; i > 0; --i) {
263 const si32 v = *sp++;
264 *dp++ = v >= 0 ? v : (- v - s);
265 }
266 }
267 else
268 {
269 const si32 *sp = src_line->i32 + src_line_offset;
270 si64 *dp = dst_line->i64 + dst_line_offset;
271 for (ui32 i = width; i > 0; --i) {
272 const si64 v = *sp++;
273 *dp++ = v >= 0 ? v : (- v - shift);
274 }
275 }
276 }
277 else
278 {
279 assert(src_line->flags | line_buf::LFT_64BIT);
280 assert(dst_line->flags | line_buf::LFT_32BIT);
281 const si64 *sp = src_line->i64 + src_line_offset;
282 si32 *dp = dst_line->i32 + dst_line_offset;
283 for (ui32 i = width; i > 0; --i) {
284 const si64 v = *sp++;
285 *dp++ = (si32)(v >= 0 ? v : (- v - shift));
286 }
287 }
288 }
289
291 void gen_cnvrt_si32_to_float_shftd(const si32 *sp, float *dp, float mul,
292 ui32 width)
293 {
294 for (ui32 i = width; i > 0; --i)
295 *dp++ = (float)*sp++ * mul - 0.5f;
296 }
297
299 void gen_cnvrt_si32_to_float(const si32 *sp, float *dp, float mul,
300 ui32 width)
301 {
302 for (ui32 i = width; i > 0; --i)
303 *dp++ = (float)*sp++ * mul;
304 }
305
307 void gen_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul,
308 ui32 width)
309 {
310 for (ui32 i = width; i > 0; --i)
311 *dp++ = ojph_round((*sp++ + 0.5f) * mul);
312 }
313
315 void gen_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul,
316 ui32 width)
317 {
318 for (ui32 i = width; i > 0; --i)
319 *dp++ = ojph_round(*sp++ * mul);
320 }
321
324 const line_buf *r, const line_buf *g, const line_buf *b,
325 line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
326 {
327 assert((y->flags & line_buf::LFT_REVERSIBLE) &&
333
334 if (y->flags & line_buf::LFT_32BIT)
335 {
336 assert((y->flags & line_buf::LFT_32BIT) &&
337 (cb->flags & line_buf::LFT_32BIT) &&
338 (cr->flags & line_buf::LFT_32BIT) &&
339 (r->flags & line_buf::LFT_32BIT) &&
340 (g->flags & line_buf::LFT_32BIT) &&
341 (b->flags & line_buf::LFT_32BIT));
342 const si32 *rp = r->i32, * gp = g->i32, * bp = b->i32;
343 si32 *yp = y->i32, * cbp = cb->i32, * crp = cr->i32;
344 for (ui32 i = repeat; i > 0; --i)
345 {
346 si32 rr = *rp++, gg = *gp++, bb = *bp++;
347 *yp++ = (rr + (gg << 1) + bb) >> 2;
348 *cbp++ = (bb - gg);
349 *crp++ = (rr - gg);
350 }
351 }
352 else
353 {
354 assert((y->flags & line_buf::LFT_64BIT) &&
355 (cb->flags & line_buf::LFT_64BIT) &&
356 (cr->flags & line_buf::LFT_64BIT) &&
357 (r->flags & line_buf::LFT_32BIT) &&
358 (g->flags & line_buf::LFT_32BIT) &&
360 const si32 *rp = r->i32, *gp = g->i32, *bp = b->i32;
361 si64 *yp = y->i64, *cbp = cb->i64, *crp = cr->i64;
362 for (ui32 i = repeat; i > 0; --i)
363 {
364 si64 rr = *rp++, gg = *gp++, bb = *bp++;
365 *yp++ = (rr + (gg << 1) + bb) >> 2;
366 *cbp++ = (bb - gg);
367 *crp++ = (rr - gg);
368 }
369 }
370 }
371
374 const line_buf *y, const line_buf *cb, const line_buf *cr,
375 line_buf *r, line_buf *g, line_buf *b, ui32 repeat)
376 {
377 assert((y->flags & line_buf::LFT_REVERSIBLE) &&
383
384 if (y->flags & line_buf::LFT_32BIT)
385 {
386 assert((y->flags & line_buf::LFT_32BIT) &&
387 (cb->flags & line_buf::LFT_32BIT) &&
388 (cr->flags & line_buf::LFT_32BIT) &&
389 (r->flags & line_buf::LFT_32BIT) &&
390 (g->flags & line_buf::LFT_32BIT) &&
392 const si32 *yp = y->i32, *cbp = cb->i32, *crp = cr->i32;
393 si32 *rp = r->i32, *gp = g->i32, *bp = b->i32;
394 for (ui32 i = repeat; i > 0; --i)
395 {
396 si32 yy = *yp++, cbb = *cbp++, crr = *crp++;
397 si32 gg = yy - ((cbb + crr) >> 2);
398 *rp++ = crr + gg;
399 *gp++ = gg;
400 *bp++ = cbb + gg;
401 }
402 }
403 else
404 {
405 assert((y->flags & line_buf::LFT_64BIT) &&
406 (cb->flags & line_buf::LFT_64BIT) &&
407 (cr->flags & line_buf::LFT_64BIT) &&
408 (r->flags & line_buf::LFT_32BIT) &&
409 (g->flags & line_buf::LFT_32BIT) &&
410 (b->flags & line_buf::LFT_32BIT));
411 const si64 *yp = y->i64, *cbp = cb->i64, *crp = cr->i64;
412 si32 *rp = r->i32, *gp = g->i32, *bp = b->i32;
413 for (ui32 i = repeat; i > 0; --i)
414 {
415 si64 yy = *yp++, cbb = *cbp++, crr = *crp++;
416 si64 gg = yy - ((cbb + crr) >> 2);
417 *rp++ = (si32)(crr + gg);
418 *gp++ = (si32)gg;
419 *bp++ = (si32)(cbb + gg);
420 }
421 }
422 }
423
425 void gen_ict_forward(const float *r, const float *g, const float *b,
426 float *y, float *cb, float *cr, ui32 repeat)
427 {
428 for (ui32 i = repeat; i > 0; --i)
429 {
430 *y = CT_CNST::ALPHA_RF * *r
431 + CT_CNST::ALPHA_GF * *g++
432 + CT_CNST::ALPHA_BF * *b;
433 *cb++ = CT_CNST::BETA_CbF * (*b++ - *y);
434 *cr++ = CT_CNST::BETA_CrF * (*r++ - *y++);
435 }
436 }
437
439 void gen_ict_backward(const float *y, const float *cb, const float *cr,
440 float *r, float *g, float *b, ui32 repeat)
441 {
442 for (ui32 i = repeat; i > 0; --i)
443 {
444 *g++ = *y - CT_CNST::GAMMA_CR2G * *cr - CT_CNST::GAMMA_CB2G * *cb;
445 *r++ = *y + CT_CNST::GAMMA_CR2R * *cr++;
446 *b++ = *y++ + CT_CNST::GAMMA_CB2B * *cb++;
447 }
448 }
449
450#endif // !OJPH_ENABLE_WASM_SIMD
451
452 }
453}
void wasm_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul, ui32 width)
void(* cnvrt_float_to_si32)(const float *sp, si32 *dp, float mul, ui32 width)
void sse2_rct_backward(const line_buf *y, const line_buf *cb, const line_buf *cr, line_buf *r, line_buf *g, line_buf *b, ui32 repeat)
void wasm_ict_backward(const float *y, const float *cb, const float *cr, float *r, float *g, float *b, ui32 repeat)
void avx2_rct_forward(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void wasm_rev_convert_nlt_type3(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void(* rct_forward)(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void wasm_cnvrt_si32_to_float_shftd(const si32 *sp, float *dp, float mul, ui32 width)
void avx_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul, ui32 width)
void(* cnvrt_si32_to_float_shftd)(const si32 *sp, float *dp, float mul, ui32 width)
void(* ict_forward)(const float *r, const float *g, const float *b, float *y, float *cb, float *cr, ui32 repeat)
void gen_rct_forward(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void avx_ict_forward(const float *r, const float *g, const float *b, float *y, float *cb, float *cr, ui32 repeat)
void gen_rct_backward(const line_buf *y, const line_buf *cb, const line_buf *cr, line_buf *r, line_buf *g, line_buf *b, ui32 repeat)
void sse2_rev_convert(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void avx_cnvrt_si32_to_float_shftd(const si32 *sp, float *dp, float mul, ui32 width)
void avx2_rct_backward(const line_buf *y, const line_buf *cb, const line_buf *cr, line_buf *r, line_buf *g, line_buf *b, ui32 repeat)
void(* ict_backward)(const float *y, const float *cb, const float *cr, float *r, float *g, float *b, ui32 repeat)
void sse2_rev_convert_nlt_type3(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void wasm_rev_convert(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void gen_cnvrt_si32_to_float(const si32 *sp, float *dp, float mul, ui32 width)
void init_colour_transform_functions()
void gen_ict_forward(const float *r, const float *g, const float *b, float *y, float *cb, float *cr, ui32 repeat)
void sse_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul, ui32 width)
void wasm_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul, ui32 width)
void sse2_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul, ui32 width)
void(* cnvrt_float_to_si32_shftd)(const float *sp, si32 *dp, float mul, ui32 width)
void(* rct_backward)(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void gen_rev_convert_nlt_type3(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void sse_ict_forward(const float *r, const float *g, const float *b, float *y, float *cb, float *cr, ui32 repeat)
void avx2_rev_convert(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void avx_cnvrt_si32_to_float(const si32 *sp, float *dp, float mul, ui32 width)
static bool colour_transform_functions_initialized
void wasm_rct_backward(const line_buf *y, const line_buf *cb, const line_buf *cr, line_buf *r, line_buf *g, line_buf *b, ui32 repeat)
void sse_cnvrt_si32_to_float_shftd(const si32 *sp, float *dp, float mul, ui32 width)
void wasm_rct_forward(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void wasm_ict_forward(const float *r, const float *g, const float *b, float *y, float *cb, float *cr, ui32 repeat)
void(* cnvrt_si32_to_float)(const si32 *sp, float *dp, float mul, ui32 width)
void avx2_rev_convert_nlt_type3(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void gen_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul, ui32 width)
void gen_ict_backward(const float *y, const float *cb, const float *cr, float *r, float *g, float *b, ui32 repeat)
void wasm_cnvrt_si32_to_float(const si32 *sp, float *dp, float mul, ui32 width)
void gen_rev_convert(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void gen_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul, ui32 width)
void sse2_rct_forward(const line_buf *r, const line_buf *g, const line_buf *b, line_buf *y, line_buf *cb, line_buf *cr, ui32 repeat)
void avx_cnvrt_float_to_si32_shftd(const float *sp, si32 *dp, float mul, ui32 width)
void avx_ict_backward(const float *y, const float *cb, const float *cr, float *r, float *g, float *b, ui32 repeat)
void sse2_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul, ui32 width)
void sse_cnvrt_si32_to_float(const si32 *sp, float *dp, float mul, ui32 width)
void(* rev_convert_nlt_type3)(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void(* rev_convert)(const line_buf *src_line, const ui32 src_line_offset, line_buf *dst_line, const ui32 dst_line_offset, si64 shift, ui32 width)
void gen_cnvrt_si32_to_float_shftd(const si32 *sp, float *dp, float mul, ui32 width)
void sse_ict_backward(const float *y, const float *cb, const float *cr, float *r, float *g, float *b, ui32 repeat)
void sse_cnvrt_float_to_si32(const float *sp, si32 *dp, float mul, ui32 width)
@ X86_CPU_EXT_LEVEL_AVX2
Definition ojph_arch.h:138
@ X86_CPU_EXT_LEVEL_AVX
Definition ojph_arch.h:137
@ X86_CPU_EXT_LEVEL_SSE2
Definition ojph_arch.h:132
@ X86_CPU_EXT_LEVEL_SSE
Definition ojph_arch.h:131
int64_t si64
Definition ojph_defs.h:57
static si32 ojph_round(float val)
Definition ojph_arch.h:263
OJPH_EXPORT int get_cpu_ext_level()
int32_t si32
Definition ojph_defs.h:55
uint32_t ui32
Definition ojph_defs.h:54
static const float GAMMA_CR2R
static const float BETA_CbF
static const float GAMMA_CB2B
static const float ALPHA_RF
static const float GAMMA_CB2G
static const float GAMMA_CR2G
static const float ALPHA_BF
static const float BETA_CrF
static const float ALPHA_GF