// dolphin/Data/User/OpenCL/TextureDecoder.cl

// Copyright (C) 2003 Dolphin Project.

// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, version 2.0.

// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License 2.0 for more details.

// A copy of the GPL 2.0 should have been included with the program.
// If not, see http://www.gnu.org/licenses/

// Official SVN repository and contact information can be found at
// http://code.google.com/p/dolphin-emu/

// Decodes one 8x8 tile of 4-bit texels per work-item.
// Every source byte holds two texels (high nibble first); each nibble is
// widened to a full byte by copying it into both halves of the output byte.
//   dst   - output, one byte per texel, rows are `width` bytes apart
//   src   - tiled input, consumed as eight consecutive 4-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeI4(global uchar *dst,
                     const global uchar *src, int width)
{
    const int x = get_global_id(0) * 8;
    const int y = get_global_id(1) * 8;
    // Index of the tile's first row, counted in 4-byte (vload4) units.
    const int tileBase = x + y * width / 8;

    for (int row = 0; row < 8; ++row)
    {
        const uchar4 packed = vload4(tileBase + row, src);

        uchar8 texels;
        texels.odd  = packed & (uchar4)0x0F;                  // low nibbles
        texels.even = (packed >> (uchar4)4) & (uchar4)0x0F;   // high nibbles
        texels |= texels << (uchar8)4;                        // 4 -> 8 bits

        vstore8(texels, 0, dst + ((y + row) * width + x));
    }
}

// Copies one 8x4 tile of 8-bit texels per work-item from the tiled source
// into the linear destination; texel bytes are passed through unchanged.
//   dst   - output, one byte per texel, rows are `width` bytes apart
//   src   - tiled input, consumed as four consecutive 8-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeI8(global uchar *dst,
                     const global uchar *src, int width)
{
    const int x = get_global_id(0) * 8;
    const int y = get_global_id(1) * 4;
    // Index of the tile's first row, counted in 8-byte (vload8) units.
    int srcRow = ((x * 4) + (y * width)) / 8;

    for (int row = 0; row < 4; ++row, ++srcRow)
    {
        const uchar8 texels = vload8(srcRow, src);
        vstore8(texels, 0, dst + ((y + row) * width + x));
    }
}

// Decodes one 4x4 tile of 16-bit texels per work-item.
// The two bytes of every texel are swapped on the way out.
//   dst   - output, two bytes per texel, rows are `width` texels apart
//   src   - tiled input, consumed as four consecutive 8-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeIA8(global uchar *dst,
                      const global uchar *src, int width)
{
    const int x = get_global_id(0) * 4;
    const int y = get_global_id(1) * 4;
    // Index of the tile's first row, counted in 8-byte (vload8) units.
    const int tileBase = ((x * 4) + (y * width)) / 4;

    for (int row = 0; row < 4; ++row)
    {
        const uchar8 in = vload8(tileBase + row, src);
        // Exchange each even/odd byte pair.
        const uchar8 swapped = in.s10325476;
        vstore8(swapped, 0, dst + ((y + row) * width + x) * 2);
    }
}

// Decodes one 8x4 tile of 8-bit texels per work-item, where each texel
// byte carries two 4-bit fields. Each field is expanded to its own output
// byte (low nibble first, then high nibble) by nibble replication.
//   dst   - output, two bytes per texel, rows are `width` texels apart
//   src   - tiled input, consumed as four consecutive 8-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeIA4(global uchar *dst,
                     const global uchar *src, int width)
{
    const int x = get_global_id(0) * 8;
    const int y = get_global_id(1) * 4;
    // Index of the tile's first row, counted in 8-byte (vload8) units.
    const int tileBase = ((x * 4) + (y * width)) / 8;

    for (int row = 0; row < 4; ++row)
    {
        const uchar8 packed = vload8(tileBase + row, src);

        uchar16 out;
        out.even = packed & (uchar8)0x0F;   // low nibble  -> first byte
        out.odd  = packed >> (uchar8)4;     // high nibble -> second byte
        out |= out << (uchar16)4;           // 4 -> 8 bits

        vstore16(out, 0, dst + ((y + row) * width + x) * 2);
    }
}

// Decodes one 4x4 tile of 32-bit texels per work-item.
// A tile row is stored as two separate 8-byte groups, four 8-byte units
// apart: the first holds byte pairs named "ar", the second pairs named
// "gb". The four bytes of every texel are interleaved on output in the
// order gb.odd, gb.even, ar.odd, ar.even.
//   dst   - output, four bytes per texel, rows are `width` texels apart
//   src   - tiled input
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeRGBA8(global uchar *dst,
                      const global uchar *src, int width)
{
    const int x = get_global_id(0) * 4;
    const int y = get_global_id(1) * 4;
    // Index of the tile's first "ar" row, counted in 8-byte (vload8) units.
    const int tileBase = (x * 2) + (y * width) / 2;

    for (int row = 0; row < 4; ++row)
    {
        const uchar8 ar = vload8(tileBase + row, src);
        const uchar8 gb = vload8(tileBase + row + 4, src);

        uchar16 texels;
        texels.s048C = gb.odd;    // byte 0 of each texel
        texels.s159D = gb.even;   // byte 1
        texels.s26AE = ar.odd;    // byte 2
        texels.s37BF = ar.even;   // byte 3

        vstore16(texels, 0, dst + ((y + row) * width + x) * 4);
    }
}

// Decodes one 4x4 tile of 16-bit texels per work-item.
// Each texel's two source bytes are combined into one ushort with the
// first byte as the high half, and stored untouched otherwise.
//   dst   - output, one ushort per texel, rows are `width` texels apart
//   src   - tiled input, consumed as four consecutive 8-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeRGB565(global ushort *dst,
                         const global uchar *src, int width)
{
    const int x = get_global_id(0) * 4;
    const int y = get_global_id(1) * 4;
    // Index of the tile's first row, counted in 8-byte (vload8) units.
    const int tileBase = x + (y * width) / 4;

    for (int row = 0; row < 4; ++row)
    {
        const uchar8 raw = vload8(tileBase + row, src);
        const ushort4 texels = upsample(raw.even, raw.odd);   // (hi << 8) | lo
        vstore4(texels, 0, dst + ((y + row) * width + x));
    }
}

// Decodes one 4x4 tile of 16-bit texels per work-item into four bytes per
// texel. Each texel is read as (first byte << 8) | second byte and decoded
// both ways; the result is then picked per texel:
//   - top bit of the first byte set:   three 5-bit colour fields, each
//     expanded to 8 bits, with the fourth output byte forced to 0xFF;
//   - top bit clear: a 3-bit field (bits 12..14) expanded to 8 bits for the
//     fourth output byte plus three 4-bit colour fields expanded to 8 bits.
//   dst   - output, four bytes per texel, rows are `width` texels apart
//   src   - tiled input, consumed as four consecutive 8-byte tile rows
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeRGB5A3(global uchar *dst,
                         const global uchar *src, int width)
{
    int x = get_global_id(0) * 4, y = get_global_id(1) * 4;
    int srcOffset = x + (y * width) / 4;
    for (int iy = 0; iy < 4; iy++)
    {
        uchar8 val = vload8(srcOffset++, src);
        ushort4 vs = upsample(val.even, val.odd);

        // 5-5-5 variant. OpenCL C does not allow explicit casts between
        // vector types, so the narrowing uses convert_uchar4 (which keeps
        // the low 8 bits of every lane). Zero-initialised so the masking
        // below never reads indeterminate lanes.
        uchar16 resNoAlpha = (uchar16)0;
        resNoAlpha.s26AE = convert_uchar4(vs >> (ushort4)7); // R
        resNoAlpha.s159D = convert_uchar4(vs >> (ushort4)2); // G
        resNoAlpha.s048C = convert_uchar4(vs << (ushort4)3); // B
        resNoAlpha &= (uchar16)0xF8;
        resNoAlpha |= resNoAlpha >> (uchar16)5; // 5 -> 8
        resNoAlpha.s37BF = (uchar4)(0xFF);

        // 3-4-4-4 variant.
        uchar16 resAlpha = (uchar16)0;
        resAlpha.s26AE = val.even;             // R
        resAlpha.s159D = val.odd >> (uchar4)4; // G
        resAlpha.s048C = val.odd;              // B
        resAlpha &= (uchar16)0x0F;
        resAlpha |= (resAlpha << (uchar16)4);  // 4 -> 8
        // Bits 12..14 land in the top three bits of the byte, then get
        // replicated downwards to fill all eight bits (3 -> 8).
        resAlpha.s37BF = convert_uchar4(vs >> (ushort4)7) & (uchar4)0xE0;
        resAlpha.s37BF |= ((resAlpha.s37BF >> (uchar4)3) & (uchar4)0x1C)
                            | ((resAlpha.s37BF >> (uchar4)6) & (uchar4)0x3);

        // select() tests the MSB of every lane of `choice`, so the first
        // byte of each texel is broadcast across that texel's four lanes.
        uchar16 choice = (uchar16)((uchar4)(val.even.s0),
                                   (uchar4)(val.even.s1),
                                   (uchar4)(val.even.s2),
                                   (uchar4)(val.even.s3));
        uchar16 res;
        res = select(resAlpha, resNoAlpha, choice);
        vstore16(res, 0, dst + ((y + iy) * width + x) * 4);
    }
}

// Splits a byte into its four 2-bit fields, most significant field first,
// and broadcasts each field across four consecutive lanes of the result
// (lanes 0-3: bits 7..6, lanes 4-7: bits 5..4, and so on).
uint16 unpack(uchar b)
{
    const uint4 field0 = (uint4)(b >> 6);
    const uint4 field1 = (uint4)((b >> 4) & 3);
    const uint4 field2 = (uint4)((b >> 2) & 3);
    const uint4 field3 = (uint4)(b & 3);

    return (uint16)(field0, field1, field2, field3);
}

// Decodes one 4x4 compressed sub-block (8 source bytes) into four rows of
// four 4-byte texels.
//
// Source layout as read here: bytes 0-1 and 2-3 are two 16-bit endpoint
// colours (high byte first), bytes 4-7 hold one row each of four 2-bit
// palette indices (most significant pair = leftmost texel).
//
//   dst   - address of the block's top-left texel in the output image
//   src   - address of the 8-byte compressed block
//   width - row pitch of the output image in texels
//
// Fixes relative to the previous revision:
//   * the palette mode was chosen with select() on a scalar isgreater()
//     result; the scalar form yields 0/1 while vector select() tests the
//     MSB, so the transparent palette was never used. The operands were
//     also reversed. A scalar ternary is used instead: endpoint0 > endpoint1
//     picks the four-colour palette, otherwise the three-colour +
//     transparent one;
//   * the middle (6-bit) channel picked up two stray bits from the
//     neighbouring 5-bit field; they are masked out now;
//   * rows were stored with a pre-incremented dst, i.e. one row below the
//     address that was passed in; the first row now lands on dst itself;
//   * unused work-item coordinates and vector-to-vector casts were removed.
kernel void decodeCMPRBlock(global uchar *dst,
                      const global uchar *src, int width)
{
    uchar8 val = vload8(0, src);

    uchar2 colora565 = (uchar2)(val.s1, val.s3);   // low bytes of both endpoints
    uchar2 colorb565 = (uchar2)(val.s0, val.s2);   // high bytes of both endpoints

    // Expand both endpoints to 8 bits per channel. Lane pairs are, in order:
    // low 5-bit field, middle 6-bit field, high 5-bit field, constant 0xFF.
    // Even lanes belong to endpoint 0, odd lanes to endpoint 1.
    uchar8 color32 = (uchar8)((colora565 << (uchar2)3) | ((colora565 >> (uchar2)2) & (uchar2)7),
                              ((colora565 >> (uchar2)3) & (uchar2)0x1C) | (colorb565 << (uchar2)5) | ((colorb565 >> (uchar2)1) & (uchar2)3),
                              (colorb565 & (uchar2)0xF8) | ((colorb565 >> (uchar2)5) & (uchar2)7),
                              (uchar2)0xFF);

    // Every lane of the palettes below packs one channel of all four palette
    // entries: entry 0 in bits 0-7, entry 1 in bits 8-15, and so on.

    // Four-colour palette: both endpoints plus two blends 3/8 of the way
    // in from either side.
    ushort4 frac2 = convert_ushort4(color32.even) - convert_ushort4(color32.odd);
    uchar4 frac = convert_uchar4((frac2 * (ushort4)3) / (ushort4)8);
    uint4 colorNoAlpha = convert_uint4(color32.odd + frac);
    colorNoAlpha = (colorNoAlpha << (uint4)8) | convert_uint4(color32.even - frac);
    colorNoAlpha = (colorNoAlpha << (uint4)8) | convert_uint4(color32.odd);
    colorNoAlpha = (colorNoAlpha << (uint4)8) | convert_uint4(color32.even);

    // Three-colour palette: both endpoints and their rounded average; the
    // fourth entry stays zero in every channel.
    uchar4 midpoint = convert_uchar4((convert_ushort4(color32.odd) + convert_ushort4(color32.even) + (ushort4)1) / (ushort4)2);
    midpoint.s3 = 0xFF;
    uint4 colorAlpha = convert_uint4(midpoint);
    colorAlpha = (colorAlpha << (uint4)8) | convert_uint4(color32.odd);
    colorAlpha = (colorAlpha << (uint4)8) | convert_uint4(color32.even);

    // Scalar comparison of the raw endpoint words selects the palette.
    ushort endpoint0 = upsample(val.s0, val.s1);
    ushort endpoint1 = upsample(val.s2, val.s3);
    uint4 colors = (endpoint0 > endpoint1) ? colorNoAlpha : colorAlpha;

    uint16 colorsFull = (uint16)(colors, colors, colors, colors);

    // Per-lane shift amounts (index * 8) for all four rows, one row per
    // byte: row 0 (val.s4) in the low byte, row 3 (val.s7) in the high byte.
    uint16 shifts = (((unpack(val.s7) << (uint16)8
                  |   unpack(val.s6)) << (uint16)8
                  |   unpack(val.s5)) << (uint16)8
                  |   unpack(val.s4)) << (uint16)3;

    for (int row = 0; row < 4; row++)
    {
        // Shifting moves the selected palette entry into the low byte of
        // each lane; convert_uchar16 then keeps just that byte.
        vstore16(convert_uchar16(colorsFull >> (shifts & (uint16)0xFF)), 0, dst);
        shifts = shifts >> (uint16)8;
        dst += width * 4;
    }
}

// Decodes one 8x8 tile per work-item. A tile consists of four consecutive
// 8-byte sub-blocks that are handed to decodeCMPRBlock in the order
// top-left, top-right, bottom-left, bottom-right.
//   dst   - output image, four bytes per texel, rows are `width` texels apart
//   src   - tiled compressed input
//   width - row pitch of dst in texels; also used to locate the tile in src
kernel void DecodeCMPR(global uchar *dst,
                      const global uchar *src, int width)
{
    const int x = get_global_id(0) * 8;
    const int y = get_global_id(1) * 8;

    // Byte offset of this tile's first sub-block.
    const global uchar *block = src + (x * 4 + (y * width) / 2);

    for (int sub = 0; sub < 4; ++sub)
    {
        const int subX = x + (sub & 1) * 4;    // 0, 4, 0, 4
        const int subY = y + (sub >> 1) * 4;   // 0, 0, 4, 4
        decodeCMPRBlock(dst + (subY * width + subX) * 4, block + sub * 8, width);
    }
}
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`// Copyright (C) 2003 Dolphin Project.`

			`// This program is free software: you can redistribute it and/or modify`
			`// it under the terms of the GNU General Public License as published by`
			`// the Free Software Foundation, version 2.0.`

			`// This program is distributed in the hope that it will be useful,`
			`// but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`// GNU General Public License 2.0 for more details.`

			`// A copy of the GPL 2.0 should have been included with the program.`
			`// If not, see http://www.gnu.org/licenses/`

			`// Official SVN repository and contact information can be found at`
			`// http://code.google.com/p/dolphin-emu/`

			`kernel void DecodeI4(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 8, y = get_global_id(1) * 8;`
			`int srcOffset = x + y * width / 8;`
			`for (int iy = 0; iy < 8; iy++)`
			`{`
			`uchar4 val = vload4(srcOffset, src);`
			`uchar8 res;`
			`res.even = (val >> (uchar4)4) & (uchar4)0x0F;`
			`res.odd = val & (uchar4)0x0F;`
			`res \|= res << (uchar8)4;`
			`vstore8(res, 0, dst + ((y + iy)*width + x));`
			`srcOffset++;`
			`}`
			`}`

			`kernel void DecodeI8(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 8, y = get_global_id(1) * 4;`
			`int srcOffset = ((x * 4) + (y * width)) / 8;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
			`vstore8(vload8(srcOffset, src),`
			`0, dst + ((y + iy)*width + x));`
			`srcOffset++;`
			`}`
			`}`

			`kernel void DecodeIA8(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 4, y = get_global_id(1) * 4;`
			`int srcOffset = ((x * 4) + (y * width)) / 4;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uchar8 val = vload8(srcOffset++, src);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`uchar8 res;`
			`res.odd = val.even;`
			`res.even = val.odd;`
			`vstore8(res, 0, dst + ((y + iy)*width + x) * 2);`
			`}`
			`}`

			`kernel void DecodeIA4(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 8, y = get_global_id(1) * 4;`
			`int srcOffset = ((x * 4) + (y * width)) / 8;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uchar8 val = vload8(srcOffset++, src);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`uchar16 res;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`res.odd = (val >> (uchar8)4);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`res.even = val & (uchar8)0x0F;`
			`res \|= res << (uchar16)4;`
			`vstore16(res, 0, dst + ((y + iy)*width + x) * 2);`
			`}`
			`}`

			`kernel void DecodeRGBA8(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 4, y = get_global_id(1) * 4;`
			`int srcOffset = (x * 2) + (y * width) / 2;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
			`uchar8 ar = vload8(srcOffset, src);`
			`uchar8 gb = vload8(srcOffset + 4, src);`
			`uchar16 res;`
			`res.even.even = gb.odd;`
			`res.even.odd = ar.odd;`
			`res.odd.even = gb.even;`
			`res.odd.odd = ar.even;`
			`vstore16(res, 0, dst + ((y + iy)*width + x) * 4);`
			`srcOffset++;`
			`}`
			`}`

			`kernel void DecodeRGB565(global ushort *dst,`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`const global uchar *src, int width)`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`{`
			`int x = get_global_id(0) * 4, y = get_global_id(1) * 4;`
			`int srcOffset = x + (y * width) / 4;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uchar8 val = vload8(srcOffset++, src);`
			`vstore4(upsample(val.even, val.odd), 0, dst + ((y + iy)*width + x));`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`}`
			`}`

			`kernel void DecodeRGB5A3(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 4, y = get_global_id(1) * 4;`
			`int srcOffset = x + (y * width) / 4;`
			`for (int iy = 0; iy < 4; iy++)`
			`{`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uchar8 val = vload8(srcOffset++, src);`
			`ushort4 vs = upsample(val.even, val.odd);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00
			`uchar16 resNoAlpha;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`resNoAlpha.s26AE = (uchar4)(vs >> (ushort4)7); // R`
			`resNoAlpha.s159D = (uchar4)(vs >> (ushort4)2); // G`
			`resNoAlpha.s048C = (uchar4)(vs << (ushort4)3); // B`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`resNoAlpha &= (uchar16)0xF8;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`resNoAlpha \|= (uchar16)(resNoAlpha >> (uchar16)5); // 5 -> 8`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`resNoAlpha.s37BF = (uchar4)(0xFF);`

			`uchar16 resAlpha;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`resAlpha.s26AE = val.even; // R`
			`resAlpha.s159D = val.odd >> (uchar4)4; // G`
			`resAlpha.s048C = val.odd; // B`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`resAlpha &= (uchar16)0x0F;`
			`resAlpha \|= (resAlpha << (uchar16)4);`
			`resAlpha.s37BF = convert_uchar4(vs >> (ushort4)7) & (uchar4)0xE0;`
			`resAlpha.s37BF \|= ((resAlpha.s37BF >> (uchar4)3) & (uchar4)0x1C)`
			`\| ((resAlpha.s37BF >> (uchar4)6) & (uchar4)0x3);`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uchar16 choice = (uchar16)((uchar4)(val.even.s0),`
			`(uchar4)(val.even.s1),`
			`(uchar4)(val.even.s2),`
			`(uchar4)(val.even.s3));`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`uchar16 res;`
			`res = select(resAlpha, resNoAlpha, choice);`
			`vstore16(res, 0, dst + ((y + iy) * width + x) * 4);`
			`}`
			`}`

apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uint16 unpack(uchar b)`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`{`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`return (uint16)((uint4)(b >> 6),`
			`(uint4)(b >> 4 & 3),`
			`(uint4)(b >> 2 & 3),`
			`(uint4)(b & 3));`
			`}`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00
			`kernel void decodeCMPRBlock(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 4, y = get_global_id(1) * 4;`
			`uchar8 val = vload8(0, src);`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00
			`uchar2 colora565 = (uchar2)(val.s1, val.s3);`
			`uchar2 colorb565 = (uchar2)(val.s0, val.s2);`
			`uchar8 color32 = (uchar8)((colora565 << (uchar2)3) \| (colora565 >> (uchar2)2 & (uchar2)7),`
			`(colora565 >> (uchar2)3) \| (colorb565 << (uchar2)5) \| (colorb565 >> (uchar2)1 & (uchar2)3),`
			`(colorb565 & (uchar2)0xF8) \| (colorb565 >> (uchar2)5 & (uchar2)7),`
			`(uchar2)0xFF);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`uint4 colors;`
			`uint4 colorNoAlpha;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`ushort4 frac2 = (ushort4)(color32.even & (uchar4)0xFF) - (ushort4)(color32.odd & (uchar4)0xFF);`
			`uchar4 frac = convert_uchar4((frac2 * (ushort4)3) / (ushort4)8);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`colorNoAlpha = convert_uint4(color32.odd + frac);`
			`colorNoAlpha = (colorNoAlpha << (uint4)8) \| convert_uint4(color32.even - frac);`
			`colorNoAlpha = (colorNoAlpha << (uint4)8) \| convert_uint4(color32.odd);`
			`colorNoAlpha = (colorNoAlpha << (uint4)8) \| convert_uint4(color32.even);`

			`uint4 colorAlpha;`
			`uchar4 midpoint = convert_uchar4((convert_ushort4(color32.odd) + convert_ushort4(color32.even) + (ushort4)1) / (ushort4)2);`
			`midpoint.s3 = 0xFF;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`colorAlpha = convert_uint4(midpoint);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`colorAlpha = (colorAlpha << (uint4)8) \| convert_uint4(color32.odd);`
			`colorAlpha = (colorAlpha << (uint4)8) \| convert_uint4(color32.even);`

apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uint4 choice = isgreater(upsample(val.s0,val.s1),upsample(val.s2, val.s3));`
			`colors = select(colorNoAlpha, colorAlpha, choice);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00
			`uint16 colorsFull = (uint16)(colors, colors, colors, colors);`

apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`uint16 shifts = (((unpack(val.s7) << (uint16)8`
			`\| unpack(val.s6)) << (uint16)8`
			`\| unpack(val.s5)) << (uint16)8`
			`\| unpack(val.s4)) << (uint16)3;`

			`vstore16(convert_uchar16(colorsFull >> (shifts & (uint16)0xFF)), 0, dst+=width * 4);`
			`shifts = shifts >> (uint16)8;`
			`vstore16(convert_uchar16(colorsFull >> (shifts & (uint16)0xFF)), 0, dst+=width * 4);`
			`shifts = shifts >> (uint16)8;`
			`vstore16(convert_uchar16(colorsFull >> (shifts & (uint16)0xFF)), 0, dst+=width * 4);`
			`shifts = shifts >> (uint16)8;`
			`vstore16(convert_uchar16(colorsFull >> (shifts & (uint16)0xFF)), 0, dst+=width * 4);`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`}`

			`kernel void DecodeCMPR(global uchar *dst,`
			`const global uchar *src, int width)`
			`{`
			`int x = get_global_id(0) * 8, y = get_global_id(1) * 8;`

			`src += x * 4 + (y * width) / 2;`

			`decodeCMPRBlock(dst + (y * width + x) * 4, src, width);`
			`src += 8;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`decodeCMPRBlock(dst + (y * width + x + 4) * 4, src, width); // + 16`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`src += 8;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`decodeCMPRBlock(dst + ((y + 4) * width + x) * 4, src, width); // + 16*width`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00			`src += 8;`
apply a patch done by xsacha :) + some minor stuff :p what changes do: cmpr decoding is fixed and rgb5a3 is re-enabled git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5744 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-19 07:59:53 +00:00			`decodeCMPRBlock(dst + ((y + 4) * width + x + 4) * 4, src, width); // + 16*(width+1)`
Hg: enable newline normalization get revision number via `hg svn info` for svnrev.h ignore incremental/generated binary files (windows/VS at least) leave a comment if some files need native eol set in svnprops git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@5637 8ced0084-cf51-0410-be5f-012b33b47a6e 2010-06-09 01:37:08 +00:00
OpenCL: Moved the OpenCL code from the compiled source to a separate file TextureDecoder.cl and added a .rules files to copy the updated version to the build directory. Fixed RGB5A3 decoding with alpha New CMPR decoding, blocks with no alpha are great, still have to figure the problems with transparent blocks. Disabled for now. Added a better error reporting to the base OpenCL functions git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@4439 8ced0084-cf51-0410-be5f-012b33b47a6e 2009-10-20 00:55:07 +00:00			`}`