#include "rs_core.rsh"
#include "rs_structs.h"
// Opaque Allocation type operations
extern uint32_t __attribute__((overloadable))
rsAllocationGetDimX(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
return alloc->mHal.drvState.lod[0].dimX;
}
extern uint32_t __attribute__((overloadable))
rsAllocationGetDimY(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
return alloc->mHal.drvState.lod[0].dimY;
}
extern uint32_t __attribute__((overloadable))
rsAllocationGetDimZ(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
return alloc->mHal.drvState.lod[0].dimZ;
}
extern uint32_t __attribute__((overloadable))
rsAllocationGetDimLOD(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
return alloc->mHal.state.hasMipmaps;
}
extern uint32_t __attribute__((overloadable))
rsAllocationGetDimFaces(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
return alloc->mHal.state.hasFaces;
}
extern rs_element __attribute__((overloadable))
rsAllocationGetElement(rs_allocation a) {
Allocation_t *alloc = (Allocation_t *)a.p;
if (alloc == NULL) {
rs_element nullElem = {0};
return nullElem;
}
Type_t *type = (Type_t *)alloc->mHal.state.type;
rs_element returnElem = {type->mHal.state.element};
return returnElem;
}
// TODO: this needs to be optimized, obviously
static void memcpy(void* dst, void* src, size_t size) {
char* dst_c = (char*) dst, *src_c = (char*) src;
for (; size > 0; size--) {
*dst_c++ = *src_c++;
}
}
#ifdef RS_DEBUG_RUNTIME
#define ELEMENT_AT(T) \
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, const T *val, uint32_t x); \
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, const T *val, uint32_t x, uint32_t y); \
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, const T *val, uint32_t x, uint32_t y, uint32_t z); \
extern void __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, T *val, uint32_t x); \
extern void __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, T *val, uint32_t x, uint32_t y); \
extern void __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, T *val, uint32_t x, uint32_t y, uint32_t z); \
\
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, T val, uint32_t x) { \
rsSetElementAt_##T(a, &val, x); \
} \
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, T val, uint32_t x, uint32_t y) { \
rsSetElementAt_##T(a, &val, x, y); \
} \
extern void __attribute__((overloadable)) \
rsSetElementAt_##T(rs_allocation a, T val, uint32_t x, uint32_t y, uint32_t z) { \
rsSetElementAt_##T(a, &val, x, y, z); \
} \
extern T __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, uint32_t x) { \
T tmp; \
rsGetElementAt_##T(a, &tmp, x); \
return tmp; \
} \
extern T __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, uint32_t x, uint32_t y) { \
T tmp; \
rsGetElementAt_##T(a, &tmp, x, y); \
return tmp; \
} \
extern T __attribute__((overloadable)) \
rsGetElementAt_##T(rs_allocation a, uint32_t x, uint32_t y, uint32_t z) { \
T tmp; \
rsGetElementAt_##T(a, &tmp, x, y, z); \
return tmp; \
}
#else
uint8_t*
rsOffset(rs_allocation a, uint32_t sizeOf, uint32_t x, uint32_t y,
uint32_t z) {
Allocation_t *alloc = (Allocation_t *)a.p;
//#ifdef __LP64__
// uint8_t *p = (uint8_t *)a.r;
//#else
uint8_t *p = (uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
//#endif
const uint32_t stride = (uint32_t)alloc->mHal.drvState.lod[0].stride;
const uint32_t dimY = alloc->mHal.drvState.lod[0].dimY;
uint8_t *dp = &p[(sizeOf * x) + (y * stride) +
(z * stride * dimY)];
return dp;
}
uint8_t*
rsOffsetNs(rs_allocation a, uint32_t x, uint32_t y, uint32_t z) {
Allocation_t *alloc = (Allocation_t *)a.p;
//#ifdef __LP64__
// uint8_t *p = (uint8_t *)a.r;
//#else
uint8_t *p = (uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
//#endif
const uint32_t stride = alloc->mHal.drvState.lod[0].stride;
const uint32_t dimY = alloc->mHal.drvState.lod[0].dimY;
const uint32_t sizeOf = alloc->mHal.state.elementSizeBytes;;
uint8_t *dp = &p[(sizeOf * x) + (y * stride) +
(z * stride * dimY)];
return dp;
}
#define SET_ELEMENT_AT_TYPE(T, typename) \
\
void \
rsSetElementAtImpl_##typename(rs_allocation a, typename val, uint32_t x, \
uint32_t y, uint32_t z); \
\
extern void __attribute__((overloadable)) \
rsSetElementAt_##typename(rs_allocation a, T val, uint32_t x) { \
rsSetElementAtImpl_##typename(a, (typename)val, x, 0, 0); \
} \
\
extern void __attribute__((overloadable)) \
rsSetElementAt_##typename(rs_allocation a, T val, uint32_t x, \
uint32_t y) { \
rsSetElementAtImpl_##typename(a, (typename)val, x, y, 0); \
} \
\
extern void __attribute__((overloadable)) \
rsSetElementAt_##typename(rs_allocation a, T val, uint32_t x, uint32_t y, \
uint32_t z) { \
rsSetElementAtImpl_##typename(a, (typename)val, x, y, z); \
} \
#define GET_ELEMENT_AT_TYPE(T, typename) \
typename \
rsGetElementAtImpl_##typename(rs_allocation a, uint32_t x, uint32_t y, \
uint32_t z); \
\
extern typename __attribute__((overloadable)) \
rsGetElementAt_##typename(rs_allocation a, uint32_t x) { \
return (typename)rsGetElementAtImpl_##typename(a, x, 0, 0); \
} \
\
extern typename __attribute__((overloadable)) \
rsGetElementAt_##typename(rs_allocation a, uint32_t x, uint32_t y) { \
return (typename)rsGetElementAtImpl_##typename(a, x, y, 0); \
} \
\
extern typename __attribute__((overloadable)) \
rsGetElementAt_##typename(rs_allocation a, uint32_t x, uint32_t y, \
uint32_t z) { \
return (typename)rsGetElementAtImpl_##typename(a, x, y, z); \
}
#define SET_ELEMENT_AT(T) SET_ELEMENT_AT_TYPE(T, T)
#define GET_ELEMENT_AT(T) GET_ELEMENT_AT_TYPE(T, T)
#define ELEMENT_AT(T) \
SET_ELEMENT_AT(T) \
GET_ELEMENT_AT(T)
extern const void * __attribute__((overloadable))
rsGetElementAt(rs_allocation a, uint32_t x) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
return &p[eSize * x];
}
extern const void * __attribute__((overloadable))
rsGetElementAt(rs_allocation a, uint32_t x, uint32_t y) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
const uint32_t stride = alloc->mHal.drvState.lod[0].stride;
return &p[(eSize * x) + (y * stride)];
}
extern const void * __attribute__((overloadable))
rsGetElementAt(rs_allocation a, uint32_t x, uint32_t y, uint32_t z) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
const uint32_t stride = alloc->mHal.drvState.lod[0].stride;
const uint32_t dimY = alloc->mHal.drvState.lod[0].dimY;
return &p[(eSize * x) + (y * stride) + (z * stride * dimY)];
}
extern void __attribute__((overloadable))
rsSetElementAt(rs_allocation a, void* ptr, uint32_t x) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
memcpy((void*)&p[eSize * x], ptr, eSize);
}
extern void __attribute__((overloadable))
rsSetElementAt(rs_allocation a, void* ptr, uint32_t x, uint32_t y) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
const uint32_t stride = alloc->mHal.drvState.lod[0].stride;
memcpy((void*)&p[(eSize * x) + (y * stride)], ptr, eSize);
}
extern void __attribute__((overloadable))
rsSetElementAt(rs_allocation a, void* ptr, uint32_t x, uint32_t y, uint32_t z) {
Allocation_t *alloc = (Allocation_t *)a.p;
const uint8_t *p = (const uint8_t *)alloc->mHal.drvState.lod[0].mallocPtr;
const uint32_t eSize = alloc->mHal.state.elementSizeBytes;
const uint32_t stride = alloc->mHal.drvState.lod[0].stride;
const uint32_t dimY = alloc->mHal.drvState.lod[0].dimY;
memcpy((void*)&p[(eSize * x) + (y * stride) + (z * stride * dimY)], ptr, eSize);
}
#endif // RS_DEBUG_RUNTIME
ELEMENT_AT(char)
ELEMENT_AT(char2)
ELEMENT_AT(char3)
ELEMENT_AT(char4)
ELEMENT_AT(uchar)
ELEMENT_AT(uchar2)
ELEMENT_AT(uchar3)
ELEMENT_AT(uchar4)
ELEMENT_AT(short)
ELEMENT_AT(short2)
ELEMENT_AT(short3)
ELEMENT_AT(short4)
ELEMENT_AT(ushort)
ELEMENT_AT(ushort2)
ELEMENT_AT(ushort3)
ELEMENT_AT(ushort4)
ELEMENT_AT(int)
ELEMENT_AT(int2)
ELEMENT_AT(int3)
ELEMENT_AT(int4)
ELEMENT_AT(uint)
ELEMENT_AT(uint2)
ELEMENT_AT(uint3)
ELEMENT_AT(uint4)
ELEMENT_AT(long)
ELEMENT_AT(long2)
ELEMENT_AT(long3)
ELEMENT_AT(long4)
ELEMENT_AT(ulong)
ELEMENT_AT(ulong2)
ELEMENT_AT(ulong3)
ELEMENT_AT(ulong4)
ELEMENT_AT(half)
ELEMENT_AT(half2)
ELEMENT_AT(half3)
ELEMENT_AT(half4)
ELEMENT_AT(float)
ELEMENT_AT(float2)
ELEMENT_AT(float3)
ELEMENT_AT(float4)
ELEMENT_AT(double)
ELEMENT_AT(double2)
ELEMENT_AT(double3)
ELEMENT_AT(double4)
typedef unsigned long long ull;
typedef unsigned long long ull2 __attribute__((ext_vector_type(2)));
typedef unsigned long long ull3 __attribute__((ext_vector_type(3)));
typedef unsigned long long ull4 __attribute__((ext_vector_type(4)));
#ifndef RS_DEBUG_RUNTIME
SET_ELEMENT_AT_TYPE(ull, ulong)
SET_ELEMENT_AT_TYPE(ull2, ulong2)
SET_ELEMENT_AT_TYPE(ull3, ulong3)
SET_ELEMENT_AT_TYPE(ull4, ulong4)
#undef SET_ELEMENT_AT_TYPE
#undef GET_ELEMENT_AT_TYPE
#undef ELEMENT_AT_TYPE
#endif
#undef ELEMENT_AT
extern uchar __attribute__((overloadable))
rsGetElementAtYuv_uchar_Y(rs_allocation a, uint32_t x, uint32_t y) {
return rsGetElementAt_uchar(a, x, y);
}
extern uchar __attribute__((overloadable))
rsGetElementAtYuv_uchar_U(rs_allocation a, uint32_t x, uint32_t y) {
Allocation_t *alloc = (Allocation_t *)a.p;
const size_t cstep = alloc->mHal.drvState.yuv.step;
const size_t shift = alloc->mHal.drvState.yuv.shift;
const size_t stride = alloc->mHal.drvState.lod[1].stride;
const uchar *pin = (const uchar *)alloc->mHal.drvState.lod[1].mallocPtr;
return pin[((x >> shift) * cstep) + ((y >> shift) * stride)];
}
extern uchar __attribute__((overloadable))
rsGetElementAtYuv_uchar_V(rs_allocation a, uint32_t x, uint32_t y) {
Allocation_t *alloc = (Allocation_t *)a.p;
const size_t cstep = alloc->mHal.drvState.yuv.step;
const size_t shift = alloc->mHal.drvState.yuv.shift;
const size_t stride = alloc->mHal.drvState.lod[2].stride;
const uchar *pin = (const uchar *)alloc->mHal.drvState.lod[2].mallocPtr;
return pin[((x >> shift) * cstep) + ((y >> shift) * stride)];
}
#define VOP(T) \
extern void __rsAllocationVStoreXImpl_##T(rs_allocation a, const T val, uint32_t x, uint32_t y, uint32_t z); \
extern T __rsAllocationVLoadXImpl_##T(rs_allocation a, uint32_t x, uint32_t y, uint32_t z); \
\
extern void __attribute__((overloadable)) \
rsAllocationVStoreX_##T(rs_allocation a, T val, uint32_t x) { \
__rsAllocationVStoreXImpl_##T(a, val, x, 0, 0); \
} \
extern void __attribute__((overloadable)) \
rsAllocationVStoreX_##T(rs_allocation a, T val, uint32_t x, uint32_t y) { \
__rsAllocationVStoreXImpl_##T(a, val, x, y, 0); \
} \
extern void __attribute__((overloadable)) \
rsAllocationVStoreX_##T(rs_allocation a, T val, uint32_t x, uint32_t y, uint32_t z) { \
__rsAllocationVStoreXImpl_##T(a, val, x, y, z); \
} \
extern T __attribute__((overloadable)) \
rsAllocationVLoadX_##T(rs_allocation a, uint32_t x) { \
return __rsAllocationVLoadXImpl_##T(a, x, 0, 0); \
} \
extern T __attribute__((overloadable)) \
rsAllocationVLoadX_##T(rs_allocation a, uint32_t x, uint32_t y) { \
return __rsAllocationVLoadXImpl_##T(a, x, y, 0); \
} \
extern T __attribute__((overloadable)) \
rsAllocationVLoadX_##T(rs_allocation a, uint32_t x, uint32_t y, uint32_t z) { \
return __rsAllocationVLoadXImpl_##T(a, x, y, z); \
}
VOP(char2)
VOP(char3)
VOP(char4)
VOP(uchar2)
VOP(uchar3)
VOP(uchar4)
VOP(short2)
VOP(short3)
VOP(short4)
VOP(ushort2)
VOP(ushort3)
VOP(ushort4)
VOP(int2)
VOP(int3)
VOP(int4)
VOP(uint2)
VOP(uint3)
VOP(uint4)
VOP(long2)
VOP(long3)
VOP(long4)
VOP(ulong2)
VOP(ulong3)
VOP(ulong4)
VOP(float2)
VOP(float3)
VOP(float4)
VOP(double2)
VOP(double3)
VOP(double4)
#undef VOP