| /* |
| * Copyright (C) 2013 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| |
| #include "rsCpuIntrinsic.h" |
| #include "rsCpuIntrinsicInlines.h" |
| |
| #ifndef RS_COMPATIBILITY_LIB |
| #include "hardware/gralloc.h" |
| #endif |
| |
| using namespace android; |
| using namespace android::renderscript; |
| |
| namespace android { |
| namespace renderscript { |
| |
| |
| class RsdCpuScriptIntrinsicYuvToRGB : public RsdCpuScriptIntrinsic { |
| public: |
| virtual void populateScript(Script *); |
| virtual void invokeFreeChildren(); |
| |
| virtual void setGlobalObj(uint32_t slot, ObjectBase *data); |
| |
| virtual ~RsdCpuScriptIntrinsicYuvToRGB(); |
| RsdCpuScriptIntrinsicYuvToRGB(RsdCpuReferenceImpl *ctx, const Script *s, const Element *e); |
| |
| protected: |
| ObjectBaseRef<Allocation> alloc; |
| |
| static void kernel(const RsForEachStubParamStruct *p, |
| uint32_t xstart, uint32_t xend, |
| uint32_t instep, uint32_t outstep); |
| }; |
| |
| } |
| } |
| |
| |
| void RsdCpuScriptIntrinsicYuvToRGB::setGlobalObj(uint32_t slot, ObjectBase *data) { |
| rsAssert(slot == 0); |
| alloc.set(static_cast<Allocation *>(data)); |
| } |
| |
| |
| |
| |
| static uchar4 rsYuvToRGBA_uchar4(uchar y, uchar u, uchar v) { |
| short Y = ((short)y) - 16; |
| short U = ((short)u) - 128; |
| short V = ((short)v) - 128; |
| |
| short4 p; |
| p.x = (Y * 298 + V * 409 + 128) >> 8; |
| p.y = (Y * 298 - U * 100 - V * 208 + 128) >> 8; |
| p.z = (Y * 298 + U * 516 + 128) >> 8; |
| p.w = 255; |
| if(p.x < 0) { |
| p.x = 0; |
| } |
| if(p.x > 255) { |
| p.x = 255; |
| } |
| if(p.y < 0) { |
| p.y = 0; |
| } |
| if(p.y > 255) { |
| p.y = 255; |
| } |
| if(p.z < 0) { |
| p.z = 0; |
| } |
| if(p.z > 255) { |
| p.z = 255; |
| } |
| |
| return (uchar4){p.x, p.y, p.z, p.w}; |
| } |
| |
| |
// Parameter table handed to rsdIntrinsicYuv_K / rsdIntrinsicYuv2_K as `param`.
// Five rows of eight 16-bit values. The constants mirror the ones used by the
// scalar rsYuvToRGBA_uchar4() path; how the external kernels consume each row
// is not visible in this file, so the layout must not be reordered.
static short YuvCoeff[5 * 8] = {
    // Conversion coefficients, the value 255, then two zeros.
    298, 409, -100, 516, -208, 255, 0, 0,
    // Luma offset.
    16, 16, 16, 16, 16, 16, 16, 16,
    // Chroma offset.
    128, 128, 128, 128, 128, 128, 128, 128,
    // Luma coefficient, repeated.
    298, 298, 298, 298, 298, 298, 298, 298,
    // 255, repeated.
    255, 255, 255, 255, 255, 255, 255, 255
};
| |
| extern "C" void rsdIntrinsicYuv_K(void *dst, const uchar *Y, const uchar *uv, uint32_t count, const short *param); |
| extern "C" void rsdIntrinsicYuv2_K(void *dst, const uchar *Y, const uchar *u, const uchar *v, uint32_t count, const short *param); |
| |
| void RsdCpuScriptIntrinsicYuvToRGB::kernel(const RsForEachStubParamStruct *p, |
| uint32_t xstart, uint32_t xend, |
| uint32_t instep, uint32_t outstep) { |
| RsdCpuScriptIntrinsicYuvToRGB *cp = (RsdCpuScriptIntrinsicYuvToRGB *)p->usr; |
| if (!cp->alloc.get()) { |
| ALOGE("YuvToRGB executed without input, skipping"); |
| return; |
| } |
| const uchar *pinY = (const uchar *)cp->alloc->mHal.drvState.lod[0].mallocPtr; |
| const size_t strideY = cp->alloc->mHal.drvState.lod[0].stride; |
| const uchar *Y = pinY + (p->y * strideY); |
| |
| uchar4 *out = (uchar4 *)p->out; |
| uint32_t x1 = xstart; |
| uint32_t x2 = xend; |
| |
| switch (cp->alloc->mHal.state.yuv) { |
| // In API 17 there was no yuv format and the intrinsic treated everything as NV21 |
| case 0: |
| #if !defined(RS_SERVER) && !defined(RS_COMPATIBILITY_LIB) |
| case HAL_PIXEL_FORMAT_YCrCb_420_SP: // NV21 |
| #endif |
| { |
| const uchar *pinUV = (const uchar *)cp->alloc->mHal.drvState.lod[1].mallocPtr; |
| const size_t strideUV = cp->alloc->mHal.drvState.lod[1].stride; |
| const uchar *uv = pinUV + ((p->y >> 1) * strideUV); |
| |
| if(x2 > x1) { |
| #if defined(ARCH_ARM_HAVE_NEON) |
| int32_t len = (x2 - x1 - 1) >> 3; |
| if(len > 0) { |
| rsdIntrinsicYuv_K(out, Y, uv, len, YuvCoeff); |
| x1 += len << 3; |
| out += len << 3; |
| } |
| #endif |
| |
| // ALOGE("y %i %i %i", p->y, x1, x2); |
| while(x1 < x2) { |
| uchar u = uv[(x1 & 0xffffe) + 1]; |
| uchar v = uv[(x1 & 0xffffe) + 0]; |
| *out = rsYuvToRGBA_uchar4(Y[x1], u, v); |
| out++; |
| x1++; |
| *out = rsYuvToRGBA_uchar4(Y[x1], u, v); |
| out++; |
| x1++; |
| } |
| } |
| } |
| break; |
| |
| #if !defined(RS_SERVER) && !defined(RS_COMPATIBILITY_LIB) |
| case HAL_PIXEL_FORMAT_YV12: |
| { |
| const uchar *pinU = (const uchar *)cp->alloc->mHal.drvState.lod[1].mallocPtr; |
| const size_t strideU = cp->alloc->mHal.drvState.lod[1].stride; |
| const uchar *u = pinU + ((p->y >> 1) * strideU); |
| |
| const uchar *pinV = (const uchar *)cp->alloc->mHal.drvState.lod[2].mallocPtr; |
| const size_t strideV = cp->alloc->mHal.drvState.lod[2].stride; |
| const uchar *v = pinV + ((p->y >> 1) * strideV); |
| |
| if(x2 > x1) { |
| #if defined(ARCH_ARM_HAVE_NEON) |
| int32_t len = (x2 - x1 - 1) >> 3; |
| if(len > 0) { |
| rsdIntrinsicYuv2_K(out, Y, u, v, len, YuvCoeff); |
| x1 += len << 3; |
| out += len << 3; |
| } |
| #endif |
| |
| // ALOGE("y %i %i %i", p->y, x1, x2); |
| while(x1 < x2) { |
| uchar ut = u[x1]; |
| uchar vt = v[x1]; |
| *out = rsYuvToRGBA_uchar4(Y[x1], ut, vt); |
| out++; |
| x1++; |
| *out = rsYuvToRGBA_uchar4(Y[x1], ut, vt); |
| out++; |
| x1++; |
| } |
| } |
| } |
| break; |
| #endif |
| } |
| |
| } |
| |
| RsdCpuScriptIntrinsicYuvToRGB::RsdCpuScriptIntrinsicYuvToRGB( |
| RsdCpuReferenceImpl *ctx, const Script *s, const Element *e) |
| : RsdCpuScriptIntrinsic(ctx, s, e, RS_SCRIPT_INTRINSIC_ID_YUV_TO_RGB) { |
| |
| mRootPtr = &kernel; |
| } |
| |
| RsdCpuScriptIntrinsicYuvToRGB::~RsdCpuScriptIntrinsicYuvToRGB() { |
| } |
| |
| void RsdCpuScriptIntrinsicYuvToRGB::populateScript(Script *s) { |
| s->mHal.info.exportedVariableCount = 1; |
| } |
| |
| void RsdCpuScriptIntrinsicYuvToRGB::invokeFreeChildren() { |
| alloc.clear(); |
| } |
| |
| |
| RsdCpuScriptImpl * rsdIntrinsic_YuvToRGB(RsdCpuReferenceImpl *ctx, |
| const Script *s, const Element *e) { |
| return new RsdCpuScriptIntrinsicYuvToRGB(ctx, s, e); |
| } |
| |
| |