660 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			660 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			C
		
	
	
	
| /********************************************************************
 | |
|  *                                                                  *
 | |
|  * THIS FILE IS PART OF THE 'ZYWRLE' VNC CODEC SOURCE CODE.         *
 | |
|  *                                                                  *
 | |
|  * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS     *
 | |
|  * GOVERNED BY A FOLLOWING BSD-STYLE SOURCE LICENSE.                *
 | |
|  * PLEASE READ THESE TERMS BEFORE DISTRIBUTING.                     *
 | |
|  *                                                                  *
 | |
|  * THE 'ZYWRLE' VNC CODEC SOURCE CODE IS (C) COPYRIGHT 2006         *
 | |
|  * BY Hitachi Systems & Services, Ltd.                              *
 | |
|  * (Noriaki Yamazaki, Research & Developement Center)               *
 | |
|  *                                                                  *
 | |
|  *                                                                  *
 | |
|  ********************************************************************
 | |
| Redistribution and use in source and binary forms, with or without
 | |
| modification, are permitted provided that the following conditions
 | |
| are met:
 | |
| 
 | |
| - Redistributions of source code must retain the above copyright
 | |
| notice, this list of conditions and the following disclaimer.
 | |
| 
 | |
| - Redistributions in binary form must reproduce the above copyright
 | |
| notice, this list of conditions and the following disclaimer in the
 | |
| documentation and/or other materials provided with the distribution.
 | |
| 
 | |
| - Neither the name of the Hitachi Systems & Services, Ltd. nor
 | |
| the names of its contributors may be used to endorse or promote
 | |
| products derived from this software without specific prior written
 | |
| permission.
 | |
| 
 | |
| THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 | |
| ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 | |
| LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 | |
| A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION
 | |
| OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 | |
| SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 | |
| LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 | |
| DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 | |
| THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 | |
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 | |
| OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | |
|  ********************************************************************/
 | |
| 
 | |
| #ifndef VNC_ENCODING_ZYWRLE_H
 | |
| #define VNC_ENCODING_ZYWRLE_H
 | |
| 
 | |
| /* Tables for Coefficients filtering. */
 | |
| #ifndef ZYWRLE_QUANTIZE
 | |
| /* Type A:lower bit omitting of EZW style. */
 | |
| static const unsigned int zywrle_param[3][3]={
 | |
| 	{0x0000F000, 0x00000000, 0x00000000},
 | |
| 	{0x0000C000, 0x00F0F0F0, 0x00000000},
 | |
| 	{0x0000C000, 0x00C0C0C0, 0x00F0F0F0},
 | |
| /*	{0x0000FF00, 0x00000000, 0x00000000},
 | |
| 	{0x0000FF00, 0x00FFFFFF, 0x00000000},
 | |
| 	{0x0000FF00, 0x00FFFFFF, 0x00FFFFFF}, */
 | |
| };
 | |
| #else
 | |
| /* Type B:Non liner quantization filter. */
 | |
| static const int8_t zywrle_conv[4][256]={
 | |
| {	/* bi=5, bo=5 r=0.0:PSNR=24.849 */
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| },
 | |
| {	/* bi=5, bo=5 r=2.0:PSNR=74.031 */
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 32,
 | |
| 	32, 32, 32, 32, 32, 32, 32, 32,
 | |
| 	32, 32, 32, 32, 32, 32, 32, 32,
 | |
| 	48, 48, 48, 48, 48, 48, 48, 48,
 | |
| 	48, 48, 48, 56, 56, 56, 56, 56,
 | |
| 	56, 56, 56, 56, 64, 64, 64, 64,
 | |
| 	64, 64, 64, 64, 72, 72, 72, 72,
 | |
| 	72, 72, 72, 72, 80, 80, 80, 80,
 | |
| 	80, 80, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 96, 96,
 | |
| 	96, 96, 96, 104, 104, 104, 104, 104,
 | |
| 	104, 104, 104, 104, 104, 112, 112, 112,
 | |
| 	112, 112, 112, 112, 112, 112, 120, 120,
 | |
| 	120, 120, 120, 120, 120, 120, 120, 120,
 | |
| 	0, -120, -120, -120, -120, -120, -120, -120,
 | |
| 	-120, -120, -120, -112, -112, -112, -112, -112,
 | |
| 	-112, -112, -112, -112, -104, -104, -104, -104,
 | |
| 	-104, -104, -104, -104, -104, -104, -96, -96,
 | |
| 	-96, -96, -96, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -80,
 | |
| 	-80, -80, -80, -80, -80, -72, -72, -72,
 | |
| 	-72, -72, -72, -72, -72, -64, -64, -64,
 | |
| 	-64, -64, -64, -64, -64, -56, -56, -56,
 | |
| 	-56, -56, -56, -56, -56, -56, -48, -48,
 | |
| 	-48, -48, -48, -48, -48, -48, -48, -48,
 | |
| 	-48, -32, -32, -32, -32, -32, -32, -32,
 | |
| 	-32, -32, -32, -32, -32, -32, -32, -32,
 | |
| 	-32, -32, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| },
 | |
| {	/* bi=5, bo=4 r=2.0:PSNR=64.441 */
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	48, 48, 48, 48, 48, 48, 48, 48,
 | |
| 	48, 48, 48, 48, 48, 48, 48, 48,
 | |
| 	48, 48, 48, 48, 48, 48, 48, 48,
 | |
| 	64, 64, 64, 64, 64, 64, 64, 64,
 | |
| 	64, 64, 64, 64, 64, 64, 64, 64,
 | |
| 	80, 80, 80, 80, 80, 80, 80, 80,
 | |
| 	80, 80, 80, 80, 80, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	104, 104, 104, 104, 104, 104, 104, 104,
 | |
| 	104, 104, 104, 112, 112, 112, 112, 112,
 | |
| 	112, 112, 112, 112, 120, 120, 120, 120,
 | |
| 	120, 120, 120, 120, 120, 120, 120, 120,
 | |
| 	0, -120, -120, -120, -120, -120, -120, -120,
 | |
| 	-120, -120, -120, -120, -120, -112, -112, -112,
 | |
| 	-112, -112, -112, -112, -112, -112, -104, -104,
 | |
| 	-104, -104, -104, -104, -104, -104, -104, -104,
 | |
| 	-104, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -80, -80, -80, -80,
 | |
| 	-80, -80, -80, -80, -80, -80, -80, -80,
 | |
| 	-80, -64, -64, -64, -64, -64, -64, -64,
 | |
| 	-64, -64, -64, -64, -64, -64, -64, -64,
 | |
| 	-64, -48, -48, -48, -48, -48, -48, -48,
 | |
| 	-48, -48, -48, -48, -48, -48, -48, -48,
 | |
| 	-48, -48, -48, -48, -48, -48, -48, -48,
 | |
| 	-48, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| },
 | |
| {	/* bi=5, bo=2 r=2.0:PSNR=43.175 */
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	88, 88, 88, 88, 88, 88, 88, 88,
 | |
| 	0, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, -88, -88, -88, -88, -88, -88, -88,
 | |
| 	-88, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| 	0, 0, 0, 0, 0, 0, 0, 0,
 | |
| }
 | |
| };
 | |
| 
 | |
| static const int8_t *zywrle_param[3][3][3]={
 | |
| 	{{zywrle_conv[0], zywrle_conv[2], zywrle_conv[0]},
 | |
|          {zywrle_conv[0], zywrle_conv[0], zywrle_conv[0]},
 | |
|          {zywrle_conv[0], zywrle_conv[0], zywrle_conv[0]}},
 | |
| 	{{zywrle_conv[0], zywrle_conv[3], zywrle_conv[0]},
 | |
|          {zywrle_conv[1], zywrle_conv[1], zywrle_conv[1]},
 | |
|          {zywrle_conv[0], zywrle_conv[0], zywrle_conv[0]}},
 | |
| 	{{zywrle_conv[0], zywrle_conv[3], zywrle_conv[0]},
 | |
|          {zywrle_conv[2], zywrle_conv[2], zywrle_conv[2]},
 | |
|          {zywrle_conv[1], zywrle_conv[1], zywrle_conv[1]}},
 | |
| };
 | |
| #endif
 | |
| 
 | |
| /*   Load/Save pixel stuffs. */
 | |
| #define ZYWRLE_YMASK15  0xFFFFFFF8
 | |
| #define ZYWRLE_UVMASK15 0xFFFFFFF8
 | |
| #define ZYWRLE_LOAD_PIXEL15(src, r, g, b)                               \
 | |
|     do {                                                                \
 | |
| 	r = (((uint8_t*)src)[S_1]<< 1)& 0xF8;                           \
 | |
| 	g = (((uint8_t*)src)[S_1]<< 6) | (((uint8_t*)src)[S_0]>> 2);    \
 | |
|         g &= 0xF8;                                                      \
 | |
| 	b =  (((uint8_t*)src)[S_0]<< 3)& 0xF8;                          \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_SAVE_PIXEL15(dst, r, g, b)                               \
 | |
|     do {                                                                \
 | |
| 	r &= 0xF8;                                                      \
 | |
| 	g &= 0xF8;                                                      \
 | |
| 	b &= 0xF8;                                                      \
 | |
| 	((uint8_t*)dst)[S_1] = (uint8_t)((r >> 1)|(g >> 6));            \
 | |
| 	((uint8_t*)dst)[S_0] = (uint8_t)(((b >> 3)|(g << 2))& 0xFF);    \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_YMASK16  0xFFFFFFFC
 | |
| #define ZYWRLE_UVMASK16 0xFFFFFFF8
 | |
| #define ZYWRLE_LOAD_PIXEL16(src, r, g, b)                               \
 | |
|     do {                                                                \
 | |
| 	r = ((uint8_t*)src)[S_1] & 0xF8;                                \
 | |
| 	g = (((uint8_t*)src)[S_1]<< 5) | (((uint8_t*)src)[S_0] >> 3);   \
 | |
|         g &= 0xFC;                                                      \
 | |
| 	b = (((uint8_t*)src)[S_0]<< 3) & 0xF8;                          \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_SAVE_PIXEL16(dst, r, g,b)                                \
 | |
|     do {                                                                \
 | |
| 	r &= 0xF8;                                                      \
 | |
| 	g &= 0xFC;                                                      \
 | |
| 	b &= 0xF8;                                                      \
 | |
| 	((uint8_t*)dst)[S_1] = (uint8_t)(r | (g >> 5));                 \
 | |
| 	((uint8_t*)dst)[S_0] = (uint8_t)(((b >> 3)|(g << 3)) & 0xFF);   \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_YMASK32  0xFFFFFFFF
 | |
| #define ZYWRLE_UVMASK32 0xFFFFFFFF
 | |
| #define ZYWRLE_LOAD_PIXEL32(src, r, g, b)     \
 | |
|     do {                                      \
 | |
| 	r = ((uint8_t*)src)[L_2];             \
 | |
| 	g = ((uint8_t*)src)[L_1];             \
 | |
| 	b = ((uint8_t*)src)[L_0];             \
 | |
|     } while (0)
 | |
| #define ZYWRLE_SAVE_PIXEL32(dst, r, g, b)             \
 | |
|     do {                                              \
 | |
| 	((uint8_t*)dst)[L_2] = (uint8_t)r;            \
 | |
| 	((uint8_t*)dst)[L_1] = (uint8_t)g;            \
 | |
| 	((uint8_t*)dst)[L_0] = (uint8_t)b;            \
 | |
|     } while (0)
 | |
| 
 | |
| static inline void harr(int8_t *px0, int8_t *px1)
 | |
| {
 | |
|     /* Piecewise-Linear Harr(PLHarr) */
 | |
|     int x0 = (int)*px0, x1 = (int)*px1;
 | |
|     int orgx0 = x0, orgx1 = x1;
 | |
| 
 | |
|     if ((x0 ^ x1) & 0x80) {
 | |
|         /* differ sign */
 | |
|         x1 += x0;
 | |
|         if (((x1 ^ orgx1) & 0x80) == 0) {
 | |
|             /* |x1| > |x0| */
 | |
|             x0 -= x1;	/* H = -B */
 | |
|         }
 | |
|     } else {
 | |
|         /* same sign */
 | |
|         x0 -= x1;
 | |
|         if (((x0 ^ orgx0) & 0x80) == 0) {
 | |
|             /* |x0| > |x1| */
 | |
|             x1 += x0;	/* L = A */
 | |
|         }
 | |
|     }
 | |
|     *px0 = (int8_t)x1;
 | |
|     *px1 = (int8_t)x0;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  1D-Wavelet transform.
 | |
| 
 | |
|  In coefficients array, the famous 'pyramid' decomposition is well used.
 | |
| 
 | |
|  1D Model:
 | |
|    |L0L0L0L0|L0L0L0L0|H0H0H0H0|H0H0H0H0| : level 0
 | |
|    |L1L1L1L1|H1H1H1H1|H0H0H0H0|H0H0H0H0| : level 1
 | |
| 
 | |
|  But this method needs line buffer because H/L is different position from X0/X1.
 | |
|  So, I used 'interleave' decomposition instead of it.
 | |
| 
 | |
|  1D Model:
 | |
|    |L0H0L0H0|L0H0L0H0|L0H0L0H0|L0H0L0H0| : level 0
 | |
|    |L1H0H1H0|L1H0H1H0|L1H0H1H0|L1H0H1H0| : level 1
 | |
| 
 | |
|  In this method, H/L and X0/X1 is always same position.
 | |
|  This lead us to more speed and less memory.
 | |
|  Of cause, the result of both method is quite same
 | |
|  because it's only difference that coefficient position.
 | |
| */
 | |
| static inline void wavelet_level(int *data, int size, int l, int skip_pixel)
 | |
| {
 | |
|     int s, ofs;
 | |
|     int8_t *px0;
 | |
|     int8_t *end;
 | |
| 
 | |
|     px0 = (int8_t*)data;
 | |
|     s = (8 << l) * skip_pixel;
 | |
|     end = px0 + (size >> (l + 1)) * s;
 | |
|     s -= 2;
 | |
|     ofs = (4 << l) * skip_pixel;
 | |
| 
 | |
|     while (px0 < end) {
 | |
|         harr(px0, px0 + ofs);
 | |
|         px0++;
 | |
|         harr(px0, px0 + ofs);
 | |
|         px0++;
 | |
|         harr(px0, px0 + ofs);
 | |
|         px0 += s;
 | |
|     }
 | |
| }
 | |
| 
 | |
| #ifndef ZYWRLE_QUANTIZE
 | |
| /* Type A:lower bit omitting of EZW style. */
 | |
| static inline void filter_wavelet_square(int *buf, int width, int height,
 | |
|                                          int level, int l)
 | |
| {
 | |
|     int r, s;
 | |
|     int x, y;
 | |
|     int *h;
 | |
|     const unsigned int *m;
 | |
| 
 | |
|     m = &(zywrle_param[level - 1][l]);
 | |
|     s = 2 << l;
 | |
| 
 | |
|     for (r = 1; r < 4; r++) {
 | |
|         h = buf;
 | |
|         if (r & 0x01) {
 | |
|             h += s >> 1;
 | |
|         }
 | |
|         if (r & 0x02) {
 | |
|             h += (s >> 1) * width;
 | |
|         }
 | |
|         for (y = 0; y < height / s; y++) {
 | |
|             for (x = 0; x < width / s; x++) {
 | |
|                 /*
 | |
|                   these are same following code.
 | |
|                   h[x] = h[x] / (~m[x]+1) * (~m[x]+1);
 | |
|                   ( round h[x] with m[x] bit )
 | |
|                   '&' operator isn't 'round' but is 'floor'.
 | |
|                   So, we must offset when h[x] is negative.
 | |
|                 */
 | |
|                 if (((int8_t*)h)[0] & 0x80) {
 | |
|                     ((int8_t*)h)[0] += ~((int8_t*)m)[0];
 | |
|                 }
 | |
|                 if (((int8_t*)h)[1] & 0x80) {
 | |
|                     ((int8_t*)h)[1] += ~((int8_t*)m)[1];
 | |
|                 }
 | |
|                 if (((int8_t*)h)[2] & 0x80) {
 | |
|                     ((int8_t*)h)[2] += ~((int8_t*)m)[2];
 | |
|                 }
 | |
|                 *h &= *m;
 | |
|                 h += s;
 | |
|             }
 | |
|             h += (s-1)*width;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| #else
 | |
| /*
 | |
|  Type B:Non liner quantization filter.
 | |
| 
 | |
|  Coefficients have Gaussian curve and smaller value which is
 | |
|  large part of coefficients isn't more important than larger value.
 | |
|  So, I use filter of Non liner quantize/dequantize table.
 | |
|  In general, Non liner quantize formula is explained as following.
 | |
| 
 | |
|     y=f(x)   = sign(x)*round( ((abs(x)/(2^7))^ r   )* 2^(bo-1) )*2^(8-bo)
 | |
|     x=f-1(y) = sign(y)*round( ((abs(y)/(2^7))^(1/r))* 2^(bi-1) )*2^(8-bi)
 | |
|  ( r:power coefficient  bi:effective MSB in input  bo:effective MSB in output )
 | |
| 
 | |
|    r < 1.0 : Smaller value is more important than larger value.
 | |
|    r > 1.0 : Larger value is more important than smaller value.
 | |
|    r = 1.0 : Liner quantization which is same with EZW style.
 | |
| 
 | |
|  r = 0.75 is famous non liner quantization used in MP3 audio codec.
 | |
|  In contrast to audio data, larger value is important in wavelet coefficients.
 | |
|  So, I select r = 2.0 table( quantize is x^2, dequantize sqrt(x) ).
 | |
| 
 | |
|  As compared with EZW style liner quantization, this filter tended to be
 | |
|  more sharp edge and be more compression rate but be more blocking noise and be
 | |
|  less quality. Especially, the surface of graphic objects has distinguishable
 | |
|  noise in middle quality mode.
 | |
| 
 | |
|  We need only quantized-dequantized(filtered) value rather than quantized value
 | |
|  itself because all values are packed or palette-lized in later ZRLE section.
 | |
|  This lead us not to need to modify client decoder when we change
 | |
|  the filtering procedure in future.
 | |
|  Client only decodes coefficients given by encoder.
 | |
| */
 | |
| static inline void filter_wavelet_square(int *buf, int width, int height,
 | |
|                                          int level, int l)
 | |
| {
 | |
|     int r, s;
 | |
|     int x, y;
 | |
|     int *h;
 | |
|     const int8_t **m;
 | |
| 
 | |
|     m = zywrle_param[level - 1][l];
 | |
|     s = 2 << l;
 | |
| 
 | |
|     for (r = 1; r < 4; r++) {
 | |
|         h = buf;
 | |
|         if (r & 0x01) {
 | |
|             h += s >> 1;
 | |
|         }
 | |
|         if (r & 0x02) {
 | |
|             h += (s >> 1) * width;
 | |
|         }
 | |
|         for (y = 0; y < height / s; y++) {
 | |
|             for (x = 0; x < width / s; x++) {
 | |
|                 ((int8_t*)h)[0] = m[0][((uint8_t*)h)[0]];
 | |
|                 ((int8_t*)h)[1] = m[1][((uint8_t*)h)[1]];
 | |
|                 ((int8_t*)h)[2] = m[2][((uint8_t*)h)[2]];
 | |
|                 h += s;
 | |
|             }
 | |
|             h += (s - 1) * width;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| #endif
 | |
| 
 | |
| static inline void wavelet(int *buf, int width, int height, int level)
 | |
| {
 | |
| 	int l, s;
 | |
| 	int *top;
 | |
| 	int *end;
 | |
| 
 | |
| 	for (l = 0; l < level; l++) {
 | |
| 		top = buf;
 | |
| 		end = buf + height * width;
 | |
| 		s = width << l;
 | |
| 		while (top < end) {
 | |
| 			wavelet_level(top, width, l, 1);
 | |
| 			top += s;
 | |
| 		}
 | |
| 		top = buf;
 | |
| 		end = buf + width;
 | |
| 		s = 1<<l;
 | |
| 		while (top < end) {
 | |
| 			wavelet_level(top, height, l, width);
 | |
| 			top += s;
 | |
| 		}
 | |
| 		filter_wavelet_square(buf, width, height, level, l);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| 
 | |
| /* Load/Save coefficients stuffs.
 | |
|  Coefficients manages as 24 bits little-endian pixel. */
 | |
| #define ZYWRLE_LOAD_COEFF(src, r, g, b)         \
 | |
|     do {                                        \
 | |
| 	r = ((int8_t*)src)[2];                  \
 | |
| 	g = ((int8_t*)src)[1];                  \
 | |
| 	b = ((int8_t*)src)[0];                  \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_SAVE_COEFF(dst, r, g, b)       \
 | |
|     do {                                      \
 | |
| 	((int8_t*)dst)[2] = (int8_t)r;        \
 | |
| 	((int8_t*)dst)[1] = (int8_t)g;        \
 | |
| 	((int8_t*)dst)[0] = (int8_t)b;        \
 | |
|     } while (0)
 | |
| 
 | |
| /*
 | |
|   RGB <=> YUV conversion stuffs.
 | |
|   YUV coversion is explained as following formula in strict meaning:
 | |
|   Y =  0.299R + 0.587G + 0.114B (   0<=Y<=255)
 | |
|   U = -0.169R - 0.331G + 0.500B (-128<=U<=127)
 | |
|   V =  0.500R - 0.419G - 0.081B (-128<=V<=127)
 | |
| 
 | |
|   I use simple conversion RCT(reversible color transform) which is described
 | |
|   in JPEG-2000 specification.
 | |
|   Y = (R + 2G + B)/4 (   0<=Y<=255)
 | |
|   U = B-G (-256<=U<=255)
 | |
|   V = R-G (-256<=V<=255)
 | |
| */
 | |
| 
 | |
| /* RCT is N-bit RGB to N-bit Y and N+1-bit UV.
 | |
|    For make Same N-bit, UV is lossy.
 | |
|    More exact PLHarr, we reduce to odd range(-127<=x<=127). */
 | |
| #define ZYWRLE_RGBYUV_(r, g, b, y, u, v, ymask, uvmask)          \
 | |
|     do {                                                         \
 | |
| 	y = (r + (g << 1) + b) >> 2;                             \
 | |
| 	u =  b - g;                                              \
 | |
| 	v =  r - g;                                              \
 | |
| 	y -= 128;                                                \
 | |
| 	u >>= 1;                                                 \
 | |
| 	v >>= 1;                                                 \
 | |
| 	y &= ymask;                                              \
 | |
| 	u &= uvmask;                                             \
 | |
| 	v &= uvmask;                                             \
 | |
| 	if (y == -128) {                                         \
 | |
|             y += (0xFFFFFFFF - ymask + 1);                       \
 | |
|         }                                                        \
 | |
| 	if (u == -128) {                                         \
 | |
|             u += (0xFFFFFFFF - uvmask + 1);                      \
 | |
|         }                                                        \
 | |
| 	if (v == -128) {                                         \
 | |
|             v += (0xFFFFFFFF - uvmask + 1);                      \
 | |
|         }                                                        \
 | |
|     } while (0)
 | |
| 
 | |
| 
 | |
| /*
 | |
|  coefficient packing/unpacking stuffs.
 | |
|  Wavelet transform makes 4 sub coefficient image from 1 original image.
 | |
| 
 | |
|  model with pyramid decomposition:
 | |
|    +------+------+
 | |
|    |      |      |
 | |
|    |  L   |  Hx  |
 | |
|    |      |      |
 | |
|    +------+------+
 | |
|    |      |      |
 | |
|    |  H   |  Hxy |
 | |
|    |      |      |
 | |
|    +------+------+
 | |
| 
 | |
|  So, we must transfer each sub images individually in strict meaning.
 | |
|  But at least ZRLE meaning, following one decompositon image is same as
 | |
|  avobe individual sub image. I use this format.
 | |
|  (Strictly saying, transfer order is reverse(Hxy->Hy->Hx->L)
 | |
|   for simplified procedure for any wavelet level.)
 | |
| 
 | |
|    +------+------+
 | |
|    |      L      |
 | |
|    +------+------+
 | |
|    |      Hx     |
 | |
|    +------+------+
 | |
|    |      Hy     |
 | |
|    +------+------+
 | |
|    |      Hxy    |
 | |
|    +------+------+
 | |
| */
 | |
| #define ZYWRLE_INC_PTR(data)                         \
 | |
|     do {                                             \
 | |
|         data++;                                      \
 | |
|         if( data - p >= (w + uw) ) {                 \
 | |
|             data += scanline-(w + uw);               \
 | |
|             p = data;                                \
 | |
|         }                                            \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_TRANSFER_COEFF(buf, data, t, w, h, scanline, level, TRANS) \
 | |
|     do {                                                                \
 | |
|         ph = buf;                                                       \
 | |
|         s = 2 << level;                                                 \
 | |
|         if (t & 0x01) {                                                 \
 | |
|             ph += s >> 1;                                               \
 | |
|         }                                                               \
 | |
|         if (t & 0x02) {                                                 \
 | |
|             ph += (s >> 1) * w;                                         \
 | |
|         }                                                               \
 | |
|         end = ph + h * w;                                               \
 | |
|         while (ph < end) {                                              \
 | |
|             line = ph + w;                                              \
 | |
|             while (ph < line) {                                         \
 | |
|                 TRANS                                                   \
 | |
|                     ZYWRLE_INC_PTR(data);                               \
 | |
|                 ph += s;                                                \
 | |
|             }                                                           \
 | |
|             ph += (s - 1) * w;                                          \
 | |
|         }                                                               \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_PACK_COEFF(buf, data, t, width, height, scanline, level)	\
 | |
|     ZYWRLE_TRANSFER_COEFF(buf, data, t, width, height, scanline, level, \
 | |
|                           ZYWRLE_LOAD_COEFF(ph, r, g, b);               \
 | |
|                           ZYWRLE_SAVE_PIXEL(data, r, g, b);)
 | |
| 
 | |
| #define ZYWRLE_UNPACK_COEFF(buf, data, t, width, height, scanline, level) \
 | |
|     ZYWRLE_TRANSFER_COEFF(buf, data, t, width, height, scanline, level, \
 | |
|                           ZYWRLE_LOAD_PIXEL(data, r, g, b);             \
 | |
|                           ZYWRLE_SAVE_COEFF(ph, r, g, b);)
 | |
| 
 | |
| #define ZYWRLE_SAVE_UNALIGN(data, TRANS)                     \
 | |
|     do {                                                     \
 | |
|         top = buf + w * h;                                   \
 | |
|         end = buf + (w + uw) * (h + uh);                     \
 | |
|         while (top < end) {                                  \
 | |
|             TRANS                                            \
 | |
|                 ZYWRLE_INC_PTR(data);                        \
 | |
|                 top++;                                       \
 | |
|         }                                                    \
 | |
|     } while (0)
 | |
| 
 | |
| #define ZYWRLE_LOAD_UNALIGN(data,TRANS)                                 \
 | |
|     do {                                                                \
 | |
|         top = buf + w * h;                                              \
 | |
|         if (uw) {                                                       \
 | |
|             p = data + w;                                               \
 | |
|             end = (int*)(p + h * scanline);                             \
 | |
|             while (p < (ZRLE_PIXEL*)end) {                              \
 | |
|                 line = (int*)(p + uw);                                  \
 | |
|                 while (p < (ZRLE_PIXEL*)line) {                         \
 | |
|                     TRANS                                               \
 | |
|                         p++;                                            \
 | |
|                     top++;                                              \
 | |
|                 }                                                       \
 | |
|                 p += scanline - uw;                                     \
 | |
|             }                                                           \
 | |
|         }                                                               \
 | |
|         if (uh) {                                                       \
 | |
|             p = data + h * scanline;                                    \
 | |
|             end = (int*)(p + uh * scanline);                            \
 | |
|             while (p < (ZRLE_PIXEL*)end) {                              \
 | |
|                 line = (int*)(p + w);                                   \
 | |
|                 while (p < (ZRLE_PIXEL*)line) {                         \
 | |
|                     TRANS                                               \
 | |
|                         p++;                                            \
 | |
|                     top++;                                              \
 | |
|                 }                                                       \
 | |
|                 p += scanline - w;                                      \
 | |
|             }                                                           \
 | |
|         }                                                               \
 | |
|         if (uw && uh) {                                                 \
 | |
|             p= data + w + h * scanline;                                 \
 | |
|             end = (int*)(p + uh * scanline);                            \
 | |
|             while (p < (ZRLE_PIXEL*)end) {                              \
 | |
|                 line = (int*)(p + uw);                                  \
 | |
|                 while (p < (ZRLE_PIXEL*)line) {                         \
 | |
|                     TRANS                                               \
 | |
|                         p++;                                            \
 | |
|                     top++;                                              \
 | |
|                 }                                                       \
 | |
|                 p += scanline-uw;                                       \
 | |
|             }                                                           \
 | |
|         }                                                               \
 | |
|     } while (0)
 | |
| 
 | |
| static inline void zywrle_calc_size(int *w, int *h, int level)
 | |
| {
 | |
|     *w &= ~((1 << level) - 1);
 | |
|     *h &= ~((1 << level) - 1);
 | |
| }
 | |
| 
 | |
| #endif
 |