Edit

kc3-lang/angle/src/libGLESv2/renderer/Image.cpp

Branch :

  • Show log

    Commit

  • Author : daniel@transgaming.com
    Date : 2012-11-28 20:54:02
    Hash : b64ed282
    Message : Adds makeRenderer9/11 functions TRAC #22134 Signed-off-by: Nicolas Capens Signed-off-by: Daniel Koch git-svn-id: https://angleproject.googlecode.com/svn/branches/dx11proto@1479 736b8ea6-26fd-11df-bfd4-992fa37f6226

  • src/libGLESv2/renderer/Image.cpp
  • //
    // Copyright (c) 2002-2012 The ANGLE Project Authors. All rights reserved.
    // Use of this source code is governed by a BSD-style license that can be
    // found in the LICENSE file.
    //
    
    // Image.cpp: Implements the rx::Image class, which acts as the interface to
    // the actual underlying surfaces of a Texture.
    
    #include "libGLESv2/renderer/Image.h"
    
    #include "libEGL/Display.h"
    
    #include "libGLESv2/main.h"
    #include "libGLESv2/mathutil.h"
    #include "libGLESv2/utilities.h"
    #include "libGLESv2/Texture.h"
    #include "libGLESv2/Framebuffer.h"
    #include "libGLESv2/renderer/RenderTarget9.h"
    
    #include "libGLESv2/renderer/renderer9_utils.h"
    
    namespace rx
    {
    
    namespace
    {
    struct L8
    {
        unsigned char L;
    
        static void average(L8 *dst, const L8 *src1, const L8 *src2)
        {
            dst->L = ((src1->L ^ src2->L) >> 1) + (src1->L & src2->L);
        }
    };
    
    struct A8L8
    {
        unsigned char L;
        unsigned char A;
    
        static void average(A8L8 *dst, const A8L8 *src1, const A8L8 *src2)
        {
            *(unsigned short*)dst = (((*(unsigned short*)src1 ^ *(unsigned short*)src2) & 0xFEFE) >> 1) + (*(unsigned short*)src1 & *(unsigned short*)src2);
        }
    };
    
    struct A8R8G8B8
    {
        unsigned char B;
        unsigned char G;
        unsigned char R;
        unsigned char A;
    
        static void average(A8R8G8B8 *dst, const A8R8G8B8 *src1, const A8R8G8B8 *src2)
        {
            *(unsigned int*)dst = (((*(unsigned int*)src1 ^ *(unsigned int*)src2) & 0xFEFEFEFE) >> 1) + (*(unsigned int*)src1 & *(unsigned int*)src2);
        }
    };
    
    struct A16B16G16R16F
    {
        unsigned short R;
        unsigned short G;
        unsigned short B;
        unsigned short A;
    
        static void average(A16B16G16R16F *dst, const A16B16G16R16F *src1, const A16B16G16R16F *src2)
        {
            dst->R = gl::float32ToFloat16((gl::float16ToFloat32(src1->R) + gl::float16ToFloat32(src2->R)) * 0.5f);
            dst->G = gl::float32ToFloat16((gl::float16ToFloat32(src1->G) + gl::float16ToFloat32(src2->G)) * 0.5f);
            dst->B = gl::float32ToFloat16((gl::float16ToFloat32(src1->B) + gl::float16ToFloat32(src2->B)) * 0.5f);
            dst->A = gl::float32ToFloat16((gl::float16ToFloat32(src1->A) + gl::float16ToFloat32(src2->A)) * 0.5f);
        }
    };
    
    struct A32B32G32R32F
    {
        float R;
        float G;
        float B;
        float A;
    
        static void average(A32B32G32R32F *dst, const A32B32G32R32F *src1, const A32B32G32R32F *src2)
        {
            dst->R = (src1->R + src2->R) * 0.5f;
            dst->G = (src1->G + src2->G) * 0.5f;
            dst->B = (src1->B + src2->B) * 0.5f;
            dst->A = (src1->A + src2->A) * 0.5f;
        }
    };
    
    template <typename T>
    void GenerateMip(unsigned int sourceWidth, unsigned int sourceHeight,
                     const unsigned char *sourceData, int sourcePitch,
                     unsigned char *destData, int destPitch)
    {
        unsigned int mipWidth = std::max(1U, sourceWidth >> 1);
        unsigned int mipHeight = std::max(1U, sourceHeight >> 1);
    
        if (sourceHeight == 1)
        {
            ASSERT(sourceWidth != 1);
    
            const T *src = (const T*)sourceData;
            T *dst = (T*)destData;
    
            for (unsigned int x = 0; x < mipWidth; x++)
            {
                T::average(&dst[x], &src[x * 2], &src[x * 2 + 1]);
            }
        }
        else if (sourceWidth == 1)
        {
            ASSERT(sourceHeight != 1);
    
            for (unsigned int y = 0; y < mipHeight; y++)
            {
                const T *src0 = (const T*)(sourceData + y * 2 * sourcePitch);
                const T *src1 = (const T*)(sourceData + y * 2 * sourcePitch + sourcePitch);
                T *dst = (T*)(destData + y * destPitch);
    
                T::average(dst, src0, src1);
            }
        }
        else
        {
            for (unsigned int y = 0; y < mipHeight; y++)
            {
                const T *src0 = (const T*)(sourceData + y * 2 * sourcePitch);
                const T *src1 = (const T*)(sourceData + y * 2 * sourcePitch + sourcePitch);
                T *dst = (T*)(destData + y * destPitch);
    
                for (unsigned int x = 0; x < mipWidth; x++)
                {
                    T tmp0;
                    T tmp1;
    
                    T::average(&tmp0, &src0[x * 2], &src0[x * 2 + 1]);
                    T::average(&tmp1, &src1[x * 2], &src1[x * 2 + 1]);
                    T::average(&dst[x], &tmp0, &tmp1);
                }
            }
        }
    }
    
    void GenerateMip(IDirect3DSurface9 *destSurface, IDirect3DSurface9 *sourceSurface)
    {
        D3DSURFACE_DESC destDesc;
        HRESULT result = destSurface->GetDesc(&destDesc);
        ASSERT(SUCCEEDED(result));
    
        D3DSURFACE_DESC sourceDesc;
        result = sourceSurface->GetDesc(&sourceDesc);
        ASSERT(SUCCEEDED(result));
    
        ASSERT(sourceDesc.Format == destDesc.Format);
        ASSERT(sourceDesc.Width == 1 || sourceDesc.Width / 2 == destDesc.Width);
        ASSERT(sourceDesc.Height == 1 || sourceDesc.Height / 2 == destDesc.Height);
    
        D3DLOCKED_RECT sourceLocked = {0};
        result = sourceSurface->LockRect(&sourceLocked, NULL, D3DLOCK_READONLY);
        ASSERT(SUCCEEDED(result));
    
        D3DLOCKED_RECT destLocked = {0};
        result = destSurface->LockRect(&destLocked, NULL, 0);
        ASSERT(SUCCEEDED(result));
    
        const unsigned char *sourceData = reinterpret_cast<const unsigned char*>(sourceLocked.pBits);
        unsigned char *destData = reinterpret_cast<unsigned char*>(destLocked.pBits);
    
        if (sourceData && destData)
        {
            switch (sourceDesc.Format)
            {
              case D3DFMT_L8:
                GenerateMip<L8>(sourceDesc.Width, sourceDesc.Height, sourceData, sourceLocked.Pitch, destData, destLocked.Pitch);
                break;
              case D3DFMT_A8L8:
                GenerateMip<A8L8>(sourceDesc.Width, sourceDesc.Height, sourceData, sourceLocked.Pitch, destData, destLocked.Pitch);
                break;
              case D3DFMT_A8R8G8B8:
              case D3DFMT_X8R8G8B8:
                GenerateMip<A8R8G8B8>(sourceDesc.Width, sourceDesc.Height, sourceData, sourceLocked.Pitch, destData, destLocked.Pitch);
                break;
              case D3DFMT_A16B16G16R16F:
                GenerateMip<A16B16G16R16F>(sourceDesc.Width, sourceDesc.Height, sourceData, sourceLocked.Pitch, destData, destLocked.Pitch);
                break;
              case D3DFMT_A32B32G32R32F:
                GenerateMip<A32B32G32R32F>(sourceDesc.Width, sourceDesc.Height, sourceData, sourceLocked.Pitch, destData, destLocked.Pitch);
                break;
              default:
                UNREACHABLE();
                break;
            }
    
            destSurface->UnlockRect();
            sourceSurface->UnlockRect();
        }
    }
    }
    
    Image::Image()
    {
        mWidth = 0; 
        mHeight = 0;
        mInternalFormat = GL_NONE;
    
        mSurface = NULL;
    
        mDirty = false;
    
        mRenderer = NULL;
    
        mD3DPool = D3DPOOL_SYSTEMMEM;
        mD3DFormat = D3DFMT_UNKNOWN;
        mActualFormat = GL_NONE;
    }
    
    Image::~Image()
    {
        if (mSurface)
        {
            mSurface->Release();
        }
    }
    
    void Image::GenerateMipmap(Image *dest, Image *source)
    {
        IDirect3DSurface9 *sourceSurface = source->getSurface();
        if (sourceSurface == NULL)
            return error(GL_OUT_OF_MEMORY);
    
        IDirect3DSurface9 *destSurface = dest->getSurface();
        GenerateMip(destSurface, sourceSurface);
    
        source->markDirty();
    }
    
    void Image::CopyLockableSurfaces(IDirect3DSurface9 *dest, IDirect3DSurface9 *source)
    {
        D3DLOCKED_RECT sourceLock = {0};
        D3DLOCKED_RECT destLock = {0};
        
        source->LockRect(&sourceLock, NULL, 0);
        dest->LockRect(&destLock, NULL, 0);
        
        if (sourceLock.pBits && destLock.pBits)
        {
            D3DSURFACE_DESC desc;
            source->GetDesc(&desc);
    
            int rows = dx::IsCompressedFormat(desc.Format) ? desc.Height / 4 : desc.Height;
            int bytes = dx::ComputeRowSize(desc.Format, desc.Width);
            ASSERT(bytes <= sourceLock.Pitch && bytes <= destLock.Pitch);
    
            for(int i = 0; i < rows; i++)
            {
                memcpy((char*)destLock.pBits + destLock.Pitch * i, (char*)sourceLock.pBits + sourceLock.Pitch * i, bytes);
            }
    
            source->UnlockRect();
            dest->UnlockRect();
        }
        else UNREACHABLE();
    }
    
    bool Image::redefine(rx::Renderer9 *renderer, GLint internalformat, GLsizei width, GLsizei height, bool forceRelease)
    {
        if (mWidth != width ||
            mHeight != height ||
            mInternalFormat != internalformat ||
            forceRelease)
        {
            mWidth = width;
            mHeight = height;
            mInternalFormat = internalformat;
            // compute the d3d format that will be used
            mD3DFormat = renderer->ConvertTextureInternalFormat(internalformat);
            mActualFormat = d3d9_gl::GetEquivalentFormat(mD3DFormat);
    
            mRenderer = Renderer9::makeRenderer9(renderer); // D3D9_REPLACE
    
            if (mSurface)
            {
                mSurface->Release();
                mSurface = NULL;
            }
    
            return true;
        }
    
        return false;
    }
    
    void Image::createSurface()
    {
        if(mSurface)
        {
            return;
        }
    
        IDirect3DTexture9 *newTexture = NULL;
        IDirect3DSurface9 *newSurface = NULL;
        const D3DPOOL poolToUse = D3DPOOL_SYSTEMMEM;
        const D3DFORMAT d3dFormat = getD3DFormat();
        ASSERT(d3dFormat != D3DFMT_INTZ); // We should never get here for depth textures
    
        if (mWidth != 0 && mHeight != 0)
        {
            int levelToFetch = 0;
            GLsizei requestWidth = mWidth;
            GLsizei requestHeight = mHeight;
            gl::MakeValidSize(true, gl::IsCompressed(mInternalFormat), &requestWidth, &requestHeight, &levelToFetch);
    
            IDirect3DDevice9 *device = mRenderer->getDevice(); // D3D9_REPLACE
    
            HRESULT result = device->CreateTexture(requestWidth, requestHeight, levelToFetch + 1, 0, d3dFormat,
                                                        poolToUse, &newTexture, NULL);
    
            if (FAILED(result))
            {
                ASSERT(result == D3DERR_OUTOFVIDEOMEMORY || result == E_OUTOFMEMORY);
                ERR("Creating image surface failed.");
                return error(GL_OUT_OF_MEMORY);
            }
    
            newTexture->GetSurfaceLevel(levelToFetch, &newSurface);
            newTexture->Release();
        }
    
        mSurface = newSurface;
        mDirty = false;
        mD3DPool = poolToUse;
    }
    
    HRESULT Image::lock(D3DLOCKED_RECT *lockedRect, const RECT *rect)
    {
        createSurface();
    
        HRESULT result = D3DERR_INVALIDCALL;
    
        if (mSurface)
        {
            result = mSurface->LockRect(lockedRect, rect, 0);
            ASSERT(SUCCEEDED(result));
    
            mDirty = true;
        }
    
        return result;
    }
    
    void Image::unlock()
    {
        if (mSurface)
        {
            HRESULT result = mSurface->UnlockRect();
            ASSERT(SUCCEEDED(result));
        }
    }
    
    bool Image::isRenderableFormat() const
    {    
        return TextureStorage::IsTextureFormatRenderable(getD3DFormat());
    }
    
    GLenum Image::getActualFormat() const
    {
        return mActualFormat;
    }
    
    D3DFORMAT Image::getD3DFormat() const
    {
        // this should only happen if the image hasn't been redefined first
        // which would be a bug by the caller
        ASSERT(mD3DFormat != D3DFMT_UNKNOWN);
    
        return mD3DFormat;
    }
    
    IDirect3DSurface9 *Image::getSurface()
    {
        createSurface();
    
        return mSurface;
    }
    
    void Image::setManagedSurface(TextureStorage2D *storage, int level)
    {
        setManagedSurface(storage->getSurfaceLevel(level, false));
    }
    
    void Image::setManagedSurface(TextureStorageCubeMap *storage, int face, int level)
    {
        setManagedSurface(storage->getCubeMapSurface(GL_TEXTURE_CUBE_MAP_POSITIVE_X + face, level, false));
    }
    
    void Image::setManagedSurface(IDirect3DSurface9 *surface)
    {
        D3DSURFACE_DESC desc;
        surface->GetDesc(&desc);
        ASSERT(desc.Pool == D3DPOOL_MANAGED);
    
        if ((GLsizei)desc.Width == mWidth && (GLsizei)desc.Height == mHeight)
        {
            if (mSurface)
            {
                CopyLockableSurfaces(surface, mSurface);
                mSurface->Release();
            }
    
            mSurface = surface;
            mD3DPool = desc.Pool;
        }
    }
    
    bool Image::updateSurface(TextureStorage2D *storage, int level, GLint xoffset, GLint yoffset, GLsizei width, GLsizei height)
    {
        return updateSurface(storage->getSurfaceLevel(level, true), xoffset, yoffset, width, height);
    }
    
    bool Image::updateSurface(TextureStorageCubeMap *storage, int face, int level, GLint xoffset, GLint yoffset, GLsizei width, GLsizei height)
    {
        return updateSurface(storage->getCubeMapSurface(GL_TEXTURE_CUBE_MAP_POSITIVE_X + face, level, true), xoffset, yoffset, width, height);
    }
    
    bool Image::updateSurface(IDirect3DSurface9 *destSurface, GLint xoffset, GLint yoffset, GLsizei width, GLsizei height)
    {
        if (!destSurface)
            return false;
    
        IDirect3DSurface9 *sourceSurface = getSurface();
    
        if (sourceSurface && sourceSurface != destSurface)
        {
            RECT rect;
            rect.left = xoffset;
            rect.top = yoffset;
            rect.right = xoffset + width;
            rect.bottom = yoffset + height;
    
            POINT point = {rect.left, rect.top};
    
            IDirect3DDevice9 *device = mRenderer->getDevice(); // D3D9_REPLACE
    
            if (mD3DPool == D3DPOOL_MANAGED)
            {
                D3DSURFACE_DESC desc;
                sourceSurface->GetDesc(&desc);
    
                IDirect3DSurface9 *surf = 0;
                HRESULT result = device->CreateOffscreenPlainSurface(desc.Width, desc.Height, desc.Format, D3DPOOL_SYSTEMMEM, &surf, NULL);
    
                if (SUCCEEDED(result))
                {
                    CopyLockableSurfaces(surf, sourceSurface);
                    result = device->UpdateSurface(surf, &rect, destSurface, &point);
                    ASSERT(SUCCEEDED(result));
                    surf->Release();
                }
            }
            else
            {
                // UpdateSurface: source must be SYSTEMMEM, dest must be DEFAULT pools 
                HRESULT result = device->UpdateSurface(sourceSurface, &rect, destSurface, &point);
                ASSERT(SUCCEEDED(result));
            }
        }
    
        destSurface->Release();
        return true;
    }
    
    // Store the pixel rectangle designated by xoffset,yoffset,width,height with pixels stored as format/type at input
    // into the target pixel rectangle.
    void Image::loadData(GLint xoffset, GLint yoffset, GLsizei width, GLsizei height,
                         GLint unpackAlignment, const void *input)
    {
        RECT lockRect =
        {
            xoffset, yoffset,
            xoffset + width, yoffset + height
        };
    
        D3DLOCKED_RECT locked;
        HRESULT result = lock(&locked, &lockRect);
        if (FAILED(result))
        {
            return;
        }
    
    
        GLsizei inputPitch = gl::ComputePitch(width, mInternalFormat, unpackAlignment);
    
        switch (mInternalFormat)
        {
          case GL_ALPHA8_EXT:
            if (gl::supportsSSE2())
            {
                loadAlphaDataSSE2(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            }
            else
            {
                loadAlphaData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            }
            break;
          case GL_LUMINANCE8_EXT:
            loadLuminanceData(width, height, inputPitch, input, locked.Pitch, locked.pBits, getD3DFormat() == D3DFMT_L8);
            break;
          case GL_ALPHA32F_EXT:
            loadAlphaFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_LUMINANCE32F_EXT:
            loadLuminanceFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_ALPHA16F_EXT:
            loadAlphaHalfFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_LUMINANCE16F_EXT:
            loadLuminanceHalfFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_LUMINANCE8_ALPHA8_EXT:
            loadLuminanceAlphaData(width, height, inputPitch, input, locked.Pitch, locked.pBits, getD3DFormat() == D3DFMT_A8L8);
            break;
          case GL_LUMINANCE_ALPHA32F_EXT:
            loadLuminanceAlphaFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_LUMINANCE_ALPHA16F_EXT:
            loadLuminanceAlphaHalfFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGB8_OES:
            loadRGBUByteData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGB565:
            loadRGB565Data(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGBA8_OES:
            if (gl::supportsSSE2())
            {
                loadRGBAUByteDataSSE2(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            }
            else
            {
                loadRGBAUByteData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            }
            break;
          case GL_RGBA4:
            loadRGBA4444Data(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGB5_A1:
            loadRGBA5551Data(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_BGRA8_EXT:
            loadBGRAData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          // float textures are converted to RGBA, not BGRA, as they're stored that way in D3D
          case GL_RGB32F_EXT:
            loadRGBFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGB16F_EXT:
            loadRGBHalfFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGBA32F_EXT:
            loadRGBAFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          case GL_RGBA16F_EXT:
            loadRGBAHalfFloatData(width, height, inputPitch, input, locked.Pitch, locked.pBits);
            break;
          default: UNREACHABLE(); 
        }
    
        unlock();
    }
    
    void Image::loadAlphaData(GLsizei width, GLsizei height,
                              int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
        
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = 0;
                dest[4 * x + 1] = 0;
                dest[4 * x + 2] = 0;
                dest[4 * x + 3] = source[x];
            }
        }
    }
    
    void Image::loadAlphaFloatData(GLsizei width, GLsizei height,
                                   int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const float *source = NULL;
        float *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const float*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<float*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = 0;
                dest[4 * x + 1] = 0;
                dest[4 * x + 2] = 0;
                dest[4 * x + 3] = source[x];
            }
        }
    }
    
    void Image::loadAlphaHalfFloatData(GLsizei width, GLsizei height,
                                       int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned short *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<unsigned short*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = 0;
                dest[4 * x + 1] = 0;
                dest[4 * x + 2] = 0;
                dest[4 * x + 3] = source[x];
            }
        }
    }
    
    void Image::loadLuminanceData(GLsizei width, GLsizei height,
                                  int inputPitch, const void *input, size_t outputPitch, void *output, bool native) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
    
            if (!native)   // BGRA8 destination format
            {
                for (int x = 0; x < width; x++)
                {
                    dest[4 * x + 0] = source[x];
                    dest[4 * x + 1] = source[x];
                    dest[4 * x + 2] = source[x];
                    dest[4 * x + 3] = 0xFF;
                }
            }
            else   // L8 destination format
            {
                memcpy(dest, source, width);
            }
        }
    }
    
    void Image::loadLuminanceFloatData(GLsizei width, GLsizei height,
                                       int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const float *source = NULL;
        float *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const float*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<float*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[x];
                dest[4 * x + 1] = source[x];
                dest[4 * x + 2] = source[x];
                dest[4 * x + 3] = 1.0f;
            }
        }
    }
    
    void Image::loadLuminanceHalfFloatData(GLsizei width, GLsizei height,
                                           int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned short *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<unsigned short*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[x];
                dest[4 * x + 1] = source[x];
                dest[4 * x + 2] = source[x];
                dest[4 * x + 3] = 0x3C00; // SEEEEEMMMMMMMMMM, S = 0, E = 15, M = 0: 16bit flpt representation of 1
            }
        }
    }
    
    void Image::loadLuminanceAlphaData(GLsizei width, GLsizei height,
                                       int inputPitch, const void *input, size_t outputPitch, void *output, bool native) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            
            if (!native)   // BGRA8 destination format
            {
                for (int x = 0; x < width; x++)
                {
                    dest[4 * x + 0] = source[2*x+0];
                    dest[4 * x + 1] = source[2*x+0];
                    dest[4 * x + 2] = source[2*x+0];
                    dest[4 * x + 3] = source[2*x+1];
                }
            }
            else
            {
                memcpy(dest, source, width * 2);
            }
        }
    }
    
    void Image::loadLuminanceAlphaFloatData(GLsizei width, GLsizei height,
                                            int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const float *source = NULL;
        float *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const float*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<float*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[2*x+0];
                dest[4 * x + 1] = source[2*x+0];
                dest[4 * x + 2] = source[2*x+0];
                dest[4 * x + 3] = source[2*x+1];
            }
        }
    }
    
    void Image::loadLuminanceAlphaHalfFloatData(GLsizei width, GLsizei height,
                                                int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned short *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<unsigned short*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[2*x+0];
                dest[4 * x + 1] = source[2*x+0];
                dest[4 * x + 2] = source[2*x+0];
                dest[4 * x + 3] = source[2*x+1];
            }
        }
    }
    
    void Image::loadRGBUByteData(GLsizei width, GLsizei height,
                                 int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[x * 3 + 2];
                dest[4 * x + 1] = source[x * 3 + 1];
                dest[4 * x + 2] = source[x * 3 + 0];
                dest[4 * x + 3] = 0xFF;
            }
        }
    }
    
    void Image::loadRGB565Data(GLsizei width, GLsizei height,
                               int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            for (int x = 0; x < width; x++)
            {
                unsigned short rgba = source[x];
                dest[4 * x + 0] = ((rgba & 0x001F) << 3) | ((rgba & 0x001F) >> 2);
                dest[4 * x + 1] = ((rgba & 0x07E0) >> 3) | ((rgba & 0x07E0) >> 9);
                dest[4 * x + 2] = ((rgba & 0xF800) >> 8) | ((rgba & 0xF800) >> 13);
                dest[4 * x + 3] = 0xFF;
            }
        }
    }
    
    void Image::loadRGBFloatData(GLsizei width, GLsizei height,
                                 int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const float *source = NULL;
        float *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const float*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<float*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[x * 3 + 0];
                dest[4 * x + 1] = source[x * 3 + 1];
                dest[4 * x + 2] = source[x * 3 + 2];
                dest[4 * x + 3] = 1.0f;
            }
        }
    }
    
    void Image::loadRGBHalfFloatData(GLsizei width, GLsizei height,
                                     int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned short *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<unsigned short*>(static_cast<unsigned char*>(output) + y * outputPitch);
            for (int x = 0; x < width; x++)
            {
                dest[4 * x + 0] = source[x * 3 + 0];
                dest[4 * x + 1] = source[x * 3 + 1];
                dest[4 * x + 2] = source[x * 3 + 2];
                dest[4 * x + 3] = 0x3C00; // SEEEEEMMMMMMMMMM, S = 0, E = 15, M = 0: 16bit flpt representation of 1
            }
        }
    }
    
    void Image::loadRGBAUByteData(GLsizei width, GLsizei height,
                                  int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned int *source = NULL;
        unsigned int *dest = NULL;
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned int*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<unsigned int*>(static_cast<unsigned char*>(output) + y * outputPitch);
    
            for (int x = 0; x < width; x++)
            {
                unsigned int rgba = source[x];
                dest[x] = (_rotl(rgba, 16) & 0x00ff00ff) | (rgba & 0xff00ff00);
            }
        }
    }
    
    void Image::loadRGBA4444Data(GLsizei width, GLsizei height,
                                 int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            for (int x = 0; x < width; x++)
            {
                unsigned short rgba = source[x];
                dest[4 * x + 0] = ((rgba & 0x00F0) << 0) | ((rgba & 0x00F0) >> 4);
                dest[4 * x + 1] = ((rgba & 0x0F00) >> 4) | ((rgba & 0x0F00) >> 8);
                dest[4 * x + 2] = ((rgba & 0xF000) >> 8) | ((rgba & 0xF000) >> 12);
                dest[4 * x + 3] = ((rgba & 0x000F) << 4) | ((rgba & 0x000F) >> 0);
            }
        }
    }
    
    void Image::loadRGBA5551Data(GLsizei width, GLsizei height,
                                 int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned short *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const unsigned short*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            for (int x = 0; x < width; x++)
            {
                unsigned short rgba = source[x];
                dest[4 * x + 0] = ((rgba & 0x003E) << 2) | ((rgba & 0x003E) >> 3);
                dest[4 * x + 1] = ((rgba & 0x07C0) >> 3) | ((rgba & 0x07C0) >> 8);
                dest[4 * x + 2] = ((rgba & 0xF800) >> 8) | ((rgba & 0xF800) >> 13);
                dest[4 * x + 3] = (rgba & 0x0001) ? 0xFF : 0;
            }
        }
    }
    
    void Image::loadRGBAFloatData(GLsizei width, GLsizei height,
                                  int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const float *source = NULL;
        float *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = reinterpret_cast<const float*>(static_cast<const unsigned char*>(input) + y * inputPitch);
            dest = reinterpret_cast<float*>(static_cast<unsigned char*>(output) + y * outputPitch);
            memcpy(dest, source, width * 16);
        }
    }
    
    void Image::loadRGBAHalfFloatData(GLsizei width, GLsizei height,
                                      int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            memcpy(dest, source, width * 8);
        }
    }
    
    void Image::loadBGRAData(GLsizei width, GLsizei height,
                             int inputPitch, const void *input, size_t outputPitch, void *output) const
    {
        const unsigned char *source = NULL;
        unsigned char *dest = NULL;
    
        for (int y = 0; y < height; y++)
        {
            source = static_cast<const unsigned char*>(input) + y * inputPitch;
            dest = static_cast<unsigned char*>(output) + y * outputPitch;
            memcpy(dest, source, width*4);
        }
    }
    
    void Image::loadCompressedData(GLint xoffset, GLint yoffset, GLsizei width, GLsizei height,
                                   const void *input) {
        ASSERT(xoffset % 4 == 0);
        ASSERT(yoffset % 4 == 0);
    
        RECT lockRect = {
            xoffset, yoffset,
            xoffset + width, yoffset + height
        };
    
        D3DLOCKED_RECT locked;
        HRESULT result = lock(&locked, &lockRect);
        if (FAILED(result))
        {
            return;
        }
    
        GLsizei inputSize = gl::ComputeCompressedSize(width, height, mInternalFormat);
        GLsizei inputPitch = gl::ComputeCompressedPitch(width, mInternalFormat);
        int rows = inputSize / inputPitch;
        for (int i = 0; i < rows; ++i)
        {
            memcpy((void*)((BYTE*)locked.pBits + i * locked.Pitch), (void*)((BYTE*)input + i * inputPitch), inputPitch);
        }
    
        unlock();
    }
    
    // This implements glCopyTex[Sub]Image2D for non-renderable internal texture formats and incomplete textures
    void Image::copy(GLint xoffset, GLint yoffset, GLint x, GLint y, GLsizei width, GLsizei height, gl::Framebuffer *source)
    {
        RenderTarget9 *renderTarget = NULL;
        IDirect3DSurface9 *surface = NULL;
        gl::Renderbuffer *colorbuffer = source->getColorbuffer();
    
        if (colorbuffer)
        {
            renderTarget = RenderTarget9::makeRenderTarget9(colorbuffer->getRenderTarget());
        }
        
        if (renderTarget)
        {
            surface = renderTarget->getSurface();
        }
    
        if (!surface)
        {
            ERR("Failed to retrieve the render target.");
            return error(GL_OUT_OF_MEMORY);
        }
    
        IDirect3DDevice9 *device = mRenderer->getDevice(); // D3D9_REPLACE
    
        IDirect3DSurface9 *renderTargetData = NULL;
        D3DSURFACE_DESC description;
        surface->GetDesc(&description);
        
        HRESULT result = device->CreateOffscreenPlainSurface(description.Width, description.Height, description.Format, D3DPOOL_SYSTEMMEM, &renderTargetData, NULL);
    
        if (FAILED(result))
        {
            ERR("Could not create matching destination surface.");
            surface->Release();
            return error(GL_OUT_OF_MEMORY);
        }
    
        result = device->GetRenderTargetData(surface, renderTargetData);
    
        if (FAILED(result))
        {
            ERR("GetRenderTargetData unexpectedly failed.");
            renderTargetData->Release();
            surface->Release();
            return error(GL_OUT_OF_MEMORY);
        }
    
        RECT sourceRect = {x, y, x + width, y + height};
        RECT destRect = {xoffset, yoffset, xoffset + width, yoffset + height};
    
        D3DLOCKED_RECT sourceLock = {0};
        result = renderTargetData->LockRect(&sourceLock, &sourceRect, 0);
    
        if (FAILED(result))
        {
            ERR("Failed to lock the source surface (rectangle might be invalid).");
            renderTargetData->Release();
            surface->Release();
            return error(GL_OUT_OF_MEMORY);
        }
    
        D3DLOCKED_RECT destLock = {0};
        result = lock(&destLock, &destRect);
        
        if (FAILED(result))
        {
            ERR("Failed to lock the destination surface (rectangle might be invalid).");
            renderTargetData->UnlockRect();
            renderTargetData->Release();
            surface->Release();
            return error(GL_OUT_OF_MEMORY);
        }
    
        if (destLock.pBits && sourceLock.pBits)
        {
            unsigned char *source = (unsigned char*)sourceLock.pBits;
            unsigned char *dest = (unsigned char*)destLock.pBits;
    
            switch (description.Format)
            {
              case D3DFMT_X8R8G8B8:
              case D3DFMT_A8R8G8B8:
                switch(getD3DFormat())
                {
                  case D3DFMT_X8R8G8B8:
                  case D3DFMT_A8R8G8B8:
                    for(int y = 0; y < height; y++)
                    {
                        memcpy(dest, source, 4 * width);
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_L8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            dest[x] = source[x * 4 + 2];
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_A8L8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            dest[x * 2 + 0] = source[x * 4 + 2];
                            dest[x * 2 + 1] = source[x * 4 + 3];
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  default:
                    UNREACHABLE();
                }
                break;
              case D3DFMT_R5G6B5:
                switch(getD3DFormat())
                {
                  case D3DFMT_X8R8G8B8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned short rgb = ((unsigned short*)source)[x];
                            unsigned char red = (rgb & 0xF800) >> 8;
                            unsigned char green = (rgb & 0x07E0) >> 3;
                            unsigned char blue = (rgb & 0x001F) << 3;
                            dest[x + 0] = blue | (blue >> 5);
                            dest[x + 1] = green | (green >> 6);
                            dest[x + 2] = red | (red >> 5);
                            dest[x + 3] = 0xFF;
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_L8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned char red = source[x * 2 + 1] & 0xF8;
                            dest[x] = red | (red >> 5);
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  default:
                    UNREACHABLE();
                }
                break;
              case D3DFMT_A1R5G5B5:
                switch(getD3DFormat())
                {
                  case D3DFMT_X8R8G8B8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned short argb = ((unsigned short*)source)[x];
                            unsigned char red = (argb & 0x7C00) >> 7;
                            unsigned char green = (argb & 0x03E0) >> 2;
                            unsigned char blue = (argb & 0x001F) << 3;
                            dest[x + 0] = blue | (blue >> 5);
                            dest[x + 1] = green | (green >> 5);
                            dest[x + 2] = red | (red >> 5);
                            dest[x + 3] = 0xFF;
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_A8R8G8B8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned short argb = ((unsigned short*)source)[x];
                            unsigned char red = (argb & 0x7C00) >> 7;
                            unsigned char green = (argb & 0x03E0) >> 2;
                            unsigned char blue = (argb & 0x001F) << 3;
                            unsigned char alpha = (signed short)argb >> 15;
                            dest[x + 0] = blue | (blue >> 5);
                            dest[x + 1] = green | (green >> 5);
                            dest[x + 2] = red | (red >> 5);
                            dest[x + 3] = alpha;
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_L8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned char red = source[x * 2 + 1] & 0x7C;
                            dest[x] = (red << 1) | (red >> 4);
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  case D3DFMT_A8L8:
                    for(int y = 0; y < height; y++)
                    {
                        for(int x = 0; x < width; x++)
                        {
                            unsigned char red = source[x * 2 + 1] & 0x7C;
                            dest[x * 2 + 0] = (red << 1) | (red >> 4);
                            dest[x * 2 + 1] = (signed char)source[x * 2 + 1] >> 7;
                        }
    
                        source += sourceLock.Pitch;
                        dest += destLock.Pitch;
                    }
                    break;
                  default:
                    UNREACHABLE();
                }
                break;
              default:
                UNREACHABLE();
            }
        }
    
        unlock();
        renderTargetData->UnlockRect();
    
        renderTargetData->Release();
        surface->Release();
    
        mDirty = true;
    }
    
    }