rsAllocation.cpp revision 37bf79153942f9cb0ce1ad1a69c4a345fa3c8806
1/*
2 * Copyright (C) 2009 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "rsContext.h"
18
19#include <GLES/gl.h>
20#include <GLES/glext.h>
21
22using namespace android;
23using namespace android::renderscript;
24
25Allocation::Allocation(Context *rsc, const Type *type) : ObjectBase(rsc)
26{
27    mAllocFile = __FILE__;
28    mAllocLine = __LINE__;
29    mPtr = NULL;
30
31    mCpuWrite = false;
32    mCpuRead = false;
33    mGpuWrite = false;
34    mGpuRead = false;
35
36    mReadWriteRatio = 0;
37    mUpdateSize = 0;
38
39    mIsTexture = false;
40    mTextureID = 0;
41
42    mIsVertexBuffer = false;
43    mBufferID = 0;
44
45    mType.set(type);
46    rsAssert(type);
47    mPtr = malloc(mType->getSizeBytes());
48    if (!mPtr) {
49        LOGE("Allocation::Allocation, alloc failure");
50    }
51}
52
53Allocation::~Allocation()
54{
55}
56
57void Allocation::setCpuWritable(bool)
58{
59}
60
61void Allocation::setGpuWritable(bool)
62{
63}
64
65void Allocation::setCpuReadable(bool)
66{
67}
68
69void Allocation::setGpuReadable(bool)
70{
71}
72
73bool Allocation::fixAllocation()
74{
75    return false;
76}
77
78void Allocation::uploadToTexture(uint32_t lodOffset)
79{
80    //rsAssert(!mTextureId);
81    rsAssert(lodOffset < mType->getLODCount());
82
83    GLenum type = mType->getElement()->getGLType();
84    GLenum format = mType->getElement()->getGLFormat();
85
86    if (!type || !format) {
87        return;
88    }
89
90    if (!mTextureID) {
91        glGenTextures(1, &mTextureID);
92    }
93    glBindTexture(GL_TEXTURE_2D, mTextureID);
94
95    Adapter2D adapt(getContext(), this);
96    for(uint32_t lod = 0; (lod + lodOffset) < mType->getLODCount(); lod++) {
97        adapt.setLOD(lod+lodOffset);
98
99        uint16_t * ptr = static_cast<uint16_t *>(adapt.getElement(0,0));
100        glTexImage2D(GL_TEXTURE_2D, lod, format,
101                     adapt.getDimX(), adapt.getDimY(),
102                     0, format, type, ptr);
103    }
104}
105
106void Allocation::uploadToBufferObject()
107{
108    rsAssert(!mType->getDimY());
109    rsAssert(!mType->getDimZ());
110
111    if (!mBufferID) {
112        glGenBuffers(1, &mBufferID);
113    }
114    glBindBuffer(GL_ARRAY_BUFFER, mBufferID);
115    glBufferData(GL_ARRAY_BUFFER, mType->getSizeBytes(), getPtr(), GL_DYNAMIC_DRAW);
116    glBindBuffer(GL_ARRAY_BUFFER, 0);
117}
118
119
120void Allocation::data(const void *data, uint32_t sizeBytes)
121{
122    uint32_t size = mType->getSizeBytes();
123    if (size != sizeBytes) {
124        LOGE("Allocation::data called with mismatched size expected %i, got %i", size, sizeBytes);
125        return;
126    }
127    memcpy(mPtr, data, size);
128    sendDirty();
129}
130
131void Allocation::read(void *data)
132{
133    memcpy(data, mPtr, mType->getSizeBytes());
134}
135
136void Allocation::subData(uint32_t xoff, uint32_t count, const void *data, uint32_t sizeBytes)
137{
138    uint32_t eSize = mType->getElementSizeBytes();
139    uint8_t * ptr = static_cast<uint8_t *>(mPtr);
140    ptr += eSize * xoff;
141    uint32_t size = count * eSize;
142
143    if (size != sizeBytes) {
144        LOGE("Allocation::subData called with mismatched size expected %i, got %i", size, sizeBytes);
145        mType->dumpLOGV("type info");
146        return;
147    }
148    memcpy(ptr, data, size);
149    sendDirty();
150}
151
152void Allocation::subData(uint32_t xoff, uint32_t yoff,
153             uint32_t w, uint32_t h, const void *data, uint32_t sizeBytes)
154{
155    uint32_t eSize = mType->getElementSizeBytes();
156    uint32_t lineSize = eSize * w;
157    uint32_t destW = mType->getDimX();
158
159    const uint8_t *src = static_cast<const uint8_t *>(data);
160    uint8_t *dst = static_cast<uint8_t *>(mPtr);
161    dst += eSize * (xoff + yoff * destW);
162
163    if ((lineSize * eSize * h) != sizeBytes) {
164        rsAssert(!"Allocation::subData called with mismatched size");
165        return;
166    }
167
168    for (uint32_t line=yoff; line < (yoff+h); line++) {
169        uint8_t * ptr = static_cast<uint8_t *>(mPtr);
170        memcpy(dst, src, lineSize);
171        src += lineSize;
172        dst += destW * eSize;
173    }
174    sendDirty();
175}
176
177void Allocation::subData(uint32_t xoff, uint32_t yoff, uint32_t zoff,
178             uint32_t w, uint32_t h, uint32_t d, const void *data, uint32_t sizeBytes)
179{
180}
181
182void Allocation::addProgramToDirty(const Program *p)
183{
184    mToDirtyList.add(p);
185}
186
187void Allocation::removeProgramToDirty(const Program *p)
188{
189    for (size_t ct=0; ct < mToDirtyList.size(); ct++) {
190        if (mToDirtyList[ct] == p) {
191            mToDirtyList.removeAt(ct);
192            return;
193        }
194    }
195    rsAssert(0);
196}
197
198void Allocation::sendDirty() const
199{
200    for (size_t ct=0; ct < mToDirtyList.size(); ct++) {
201        mToDirtyList[ct]->forceDirty();
202    }
203}
204
205/////////////////
206//
207
208
209namespace android {
210namespace renderscript {
211
212RsAllocation rsi_AllocationCreateTyped(Context *rsc, RsType vtype)
213{
214    const Type * type = static_cast<const Type *>(vtype);
215
216    Allocation * alloc = new Allocation(rsc, type);
217    alloc->incUserRef();
218    return alloc;
219}
220
221RsAllocation rsi_AllocationCreateSized(Context *rsc, RsElement e, size_t count)
222{
223    Type * type = new Type(rsc);
224    type->setDimX(count);
225    type->setElement(static_cast<Element *>(e));
226    type->compute();
227    return rsi_AllocationCreateTyped(rsc, type);
228}
229
230void rsi_AllocationUploadToTexture(Context *rsc, RsAllocation va, uint32_t baseMipLevel)
231{
232    Allocation *alloc = static_cast<Allocation *>(va);
233    alloc->uploadToTexture(baseMipLevel);
234}
235
236void rsi_AllocationUploadToBufferObject(Context *rsc, RsAllocation va)
237{
238    Allocation *alloc = static_cast<Allocation *>(va);
239    alloc->uploadToBufferObject();
240}
241
242static void mip565(const Adapter2D &out, const Adapter2D &in)
243{
244    uint32_t w = out.getDimX();
245    uint32_t h = out.getDimY();
246
247    for (uint32_t y=0; y < h; y++) {
248        uint16_t *oPtr = static_cast<uint16_t *>(out.getElement(0, y));
249        const uint16_t *i1 = static_cast<uint16_t *>(in.getElement(0, y*2));
250        const uint16_t *i2 = static_cast<uint16_t *>(in.getElement(0, y*2+1));
251
252        for (uint32_t x=0; x < w; x++) {
253            *oPtr = rsBoxFilter565(i1[0], i1[1], i2[0], i2[1]);
254            oPtr ++;
255            i1 += 2;
256            i2 += 2;
257        }
258    }
259}
260
261static void mip8888(const Adapter2D &out, const Adapter2D &in)
262{
263    uint32_t w = out.getDimX();
264    uint32_t h = out.getDimY();
265
266    for (uint32_t y=0; y < h; y++) {
267        uint32_t *oPtr = static_cast<uint32_t *>(out.getElement(0, y));
268        const uint32_t *i1 = static_cast<uint32_t *>(in.getElement(0, y*2));
269        const uint32_t *i2 = static_cast<uint32_t *>(in.getElement(0, y*2+1));
270
271        for (uint32_t x=0; x < w; x++) {
272            *oPtr = rsBoxFilter8888(i1[0], i1[1], i2[0], i2[1]);
273            oPtr ++;
274            i1 += 2;
275            i2 += 2;
276        }
277    }
278}
279
280static void mip(const Adapter2D &out, const Adapter2D &in)
281{
282    switch(out.getBaseType()->getElement()->getSizeBits()) {
283    case 32:
284        mip8888(out, in);
285        break;
286    case 16:
287        mip565(out, in);
288        break;
289
290    }
291
292}
293
// Signature shared by all element converters: convert |count| elements from
// |src| into |dst|.
typedef void (*ElementConverter_t)(void *dst, const void *src, uint32_t count);

// Straight copy of |count| 2-byte elements.
static void elementConverter_cpy_16(void *dst, const void *src, uint32_t count)
{
    const uint32_t byteCount = count * 2u;
    memcpy(dst, src, byteCount);
}
// Straight copy of |count| 1-byte elements.
static void elementConverter_cpy_8(void *dst, const void *src, uint32_t count)
{
    const uint32_t byteCount = count;
    memcpy(dst, src, byteCount);
}
// Straight copy of |count| 4-byte elements.
static void elementConverter_cpy_32(void *dst, const void *src, uint32_t count)
{
    const uint32_t byteCount = count * 4u;
    memcpy(dst, src, byteCount);
}
308
309
310static void elementConverter_888_to_565(void *dst, const void *src, uint32_t count)
311{
312    uint16_t *d = static_cast<uint16_t *>(dst);
313    const uint8_t *s = static_cast<const uint8_t *>(src);
314
315    while(count--) {
316        *d = rs888to565(s[0], s[1], s[2]);
317        d++;
318        s+= 3;
319    }
320}
321
322static void elementConverter_8888_to_565(void *dst, const void *src, uint32_t count)
323{
324    uint16_t *d = static_cast<uint16_t *>(dst);
325    const uint8_t *s = static_cast<const uint8_t *>(src);
326
327    while(count--) {
328        *d = rs888to565(s[0], s[1], s[2]);
329        d++;
330        s+= 4;
331    }
332}
333
334static ElementConverter_t pickConverter(const Element *dst, const Element *src)
335{
336    GLenum srcGLType = src->getGLType();
337    GLenum srcGLFmt = src->getGLFormat();
338    GLenum dstGLType = dst->getGLType();
339    GLenum dstGLFmt = dst->getGLFormat();
340
341    if (srcGLFmt == dstGLFmt && srcGLType == dstGLType) {
342        switch(dst->getSizeBytes()) {
343        case 4:
344            return elementConverter_cpy_32;
345        case 2:
346            return elementConverter_cpy_16;
347        case 1:
348            return elementConverter_cpy_8;
349        }
350    }
351
352    if (srcGLType == GL_UNSIGNED_BYTE &&
353        srcGLFmt == GL_RGB &&
354        dstGLType == GL_UNSIGNED_SHORT_5_6_5 &&
355        dstGLType == GL_RGB) {
356
357        return elementConverter_888_to_565;
358    }
359
360    if (srcGLType == GL_UNSIGNED_BYTE &&
361        srcGLFmt == GL_RGBA &&
362        dstGLType == GL_UNSIGNED_SHORT_5_6_5 &&
363        dstGLType == GL_RGB) {
364
365        return elementConverter_8888_to_565;
366    }
367
368    LOGE("pickConverter, unsuported combo, src %p,  dst %p", src, dst);
369    return 0;
370}
371
372
373RsAllocation rsi_AllocationCreateFromBitmap(Context *rsc, uint32_t w, uint32_t h, RsElement _dst, RsElement _src,  bool genMips, const void *data)
374{
375    const Element *src = static_cast<const Element *>(_src);
376    const Element *dst = static_cast<const Element *>(_dst);
377    rsAssert(!(w & (w-1)));
378    rsAssert(!(h & (h-1)));
379
380    //LOGE("rsi_AllocationCreateFromBitmap %i %i %i %i %i", w, h, dstFmt, srcFmt, genMips);
381    rsi_TypeBegin(rsc, _dst);
382    rsi_TypeAdd(rsc, RS_DIMENSION_X, w);
383    rsi_TypeAdd(rsc, RS_DIMENSION_Y, h);
384    if (genMips) {
385        rsi_TypeAdd(rsc, RS_DIMENSION_LOD, 1);
386    }
387    RsType type = rsi_TypeCreate(rsc);
388
389    RsAllocation vTexAlloc = rsi_AllocationCreateTyped(rsc, type);
390    Allocation *texAlloc = static_cast<Allocation *>(vTexAlloc);
391    if (texAlloc == NULL) {
392        LOGE("Memory allocation failure");
393        return NULL;
394    }
395    texAlloc->incUserRef();
396
397    ElementConverter_t cvt = pickConverter(dst, src);
398    cvt(texAlloc->getPtr(), data, w * h);
399
400    if (genMips) {
401        Adapter2D adapt(rsc, texAlloc);
402        Adapter2D adapt2(rsc, texAlloc);
403        for(uint32_t lod=0; lod < (texAlloc->getType()->getLODCount() -1); lod++) {
404            adapt.setLOD(lod);
405            adapt2.setLOD(lod + 1);
406            mip(adapt2, adapt);
407        }
408    }
409
410    return texAlloc;
411}
412
413RsAllocation rsi_AllocationCreateFromBitmapBoxed(Context *rsc, uint32_t w, uint32_t h, RsElement _dst, RsElement _src, bool genMips, const void *data)
414{
415    const Element *srcE = static_cast<const Element *>(_src);
416    const Element *dstE = static_cast<const Element *>(_dst);
417    uint32_t w2 = rsHigherPow2(w);
418    uint32_t h2 = rsHigherPow2(h);
419
420    if ((w2 == w) && (h2 == h)) {
421        return rsi_AllocationCreateFromBitmap(rsc, w, h, _dst, _src, genMips, data);
422    }
423
424    uint32_t bpp = srcE->getSizeBytes();
425    size_t size = w2 * h2 * bpp;
426    uint8_t *tmp = static_cast<uint8_t *>(malloc(size));
427    memset(tmp, 0, size);
428
429    const uint8_t * src = static_cast<const uint8_t *>(data);
430    for (uint32_t y = 0; y < h; y++) {
431        uint8_t * ydst = &tmp[(y + ((h2 - h) >> 1)) * w2 * bpp];
432        memcpy(&ydst[((w2 - w) >> 1) * bpp], src, w * bpp);
433        src += w * bpp;
434    }
435
436    RsAllocation ret = rsi_AllocationCreateFromBitmap(rsc, w2, h2, _dst, _src, genMips, tmp);
437    free(tmp);
438    return ret;
439}
440
441void rsi_AllocationData(Context *rsc, RsAllocation va, const void *data, uint32_t sizeBytes)
442{
443    Allocation *a = static_cast<Allocation *>(va);
444    a->data(data, sizeBytes);
445}
446
447void rsi_Allocation1DSubData(Context *rsc, RsAllocation va, uint32_t xoff, uint32_t count, const void *data, uint32_t sizeBytes)
448{
449    Allocation *a = static_cast<Allocation *>(va);
450    a->subData(xoff, count, data, sizeBytes);
451}
452
453void rsi_Allocation2DSubData(Context *rsc, RsAllocation va, uint32_t xoff, uint32_t yoff, uint32_t w, uint32_t h, const void *data, uint32_t sizeBytes)
454{
455    Allocation *a = static_cast<Allocation *>(va);
456    a->subData(xoff, yoff, w, h, data, sizeBytes);
457}
458
459void rsi_AllocationRead(Context *rsc, RsAllocation va, void *data)
460{
461    Allocation *a = static_cast<Allocation *>(va);
462    a->read(data);
463}
464
465
466}
467}
468