/* autogenerated from example3orc.orc */

#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

/*
 * Fixed-width integer typedefs and the 16/32/64-bit "view" unions used by
 * the generated code.  Three variants are provided: C99 <stdint.h>, MSVC
 * built-in sized types, and a <limits.h>-based fallback.
 */
#ifndef _ORC_INTEGER_TYPEDEFS_
#define _ORC_INTEGER_TYPEDEFS_
#if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L
#include <stdint.h>
typedef int8_t orc_int8;
typedef int16_t orc_int16;
typedef int32_t orc_int32;
typedef int64_t orc_int64;
typedef uint8_t orc_uint8;
typedef uint16_t orc_uint16;
typedef uint32_t orc_uint32;
typedef uint64_t orc_uint64;
#define ORC_UINT64_C(x) UINT64_C(x)
#elif defined(_MSC_VER)
typedef signed __int8 orc_int8;
typedef signed __int16 orc_int16;
typedef signed __int32 orc_int32;
typedef signed __int64 orc_int64;
typedef unsigned __int8 orc_uint8;
typedef unsigned __int16 orc_uint16;
typedef unsigned __int32 orc_uint32;
typedef unsigned __int64 orc_uint64;
#define ORC_UINT64_C(x) (x##Ui64)
#define inline __inline
#else
#include <limits.h>
typedef signed char orc_int8;
typedef short orc_int16;
typedef int orc_int32;
typedef unsigned char orc_uint8;
typedef unsigned short orc_uint16;
typedef unsigned int orc_uint32;
#if INT_MAX == LONG_MAX
typedef long long orc_int64;
typedef unsigned long long orc_uint64;
#define ORC_UINT64_C(x) (x##ULL)
#else
typedef long orc_int64;
typedef unsigned long orc_uint64;
#define ORC_UINT64_C(x) (x##UL)
#endif
#endif
typedef union { orc_int16 i; orc_int8 x2[2]; } orc_union16;
typedef union { orc_int32 i; float f; orc_int16 x2[2]; orc_int8 x4[4]; } orc_union32;
typedef union { orc_int64 i; double f; orc_int32 x2[2]; float x2f[2]; orc_int16 x4[4]; } orc_union64;
#endif

/* Spelling of the "restrict" qualifier for the compiler in use. */
#ifndef ORC_RESTRICT
#if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L
#define ORC_RESTRICT restrict
#elif defined(__GNUC__) && __GNUC__ >= 4
#define ORC_RESTRICT __restrict__
#else
#define ORC_RESTRICT
#endif
#endif

/* Hidden-visibility attribute, where the compiler offers one. */
#ifndef ORC_INTERNAL
#if defined(__SUNPRO_C) && (__SUNPRO_C >= 0x590)
#define ORC_INTERNAL __attribute__((visibility("hidden")))
#elif defined(__SUNPRO_C) && (__SUNPRO_C >= 0x550)
#define ORC_INTERNAL __hidden
#elif defined(__GNUC__)
#define ORC_INTERNAL __attribute__((visibility("hidden")))
#else
#define ORC_INTERNAL
#endif
#endif

#ifndef DISABLE_ORC
#include <orc/orc.h>
#endif

void convert_I420_AYUV (orc_uint32 * ORC_RESTRICT d1, int d1_stride,
    orc_uint32 * ORC_RESTRICT d2, int d2_stride,
    const orc_uint8 * ORC_RESTRICT s1, int s1_stride,
    const orc_uint8 * ORC_RESTRICT s2, int s2_stride,
    const orc_uint8 * ORC_RESTRICT s3, int s3_stride,
    const orc_uint8 * ORC_RESTRICT s4, int s4_stride, int n, int m);

/* begin Orc C target preamble */
#define ORC_CLAMP(x,a,b) ((x)<(a) ? (a) : ((x)>(b) ? (b) : (x)))
#define ORC_ABS(a) ((a)<0 ? -(a) : (a))
#define ORC_MIN(a,b) ((a)<(b) ? (a) : (b))
#define ORC_MAX(a,b) ((a)>(b) ? (a) : (b))
#define ORC_SB_MAX 127
#define ORC_SB_MIN (-1-ORC_SB_MAX)
#define ORC_UB_MAX 255
#define ORC_UB_MIN 0
#define ORC_SW_MAX 32767
#define ORC_SW_MIN (-1-ORC_SW_MAX)
#define ORC_UW_MAX 65535
#define ORC_UW_MIN 0
#define ORC_SL_MAX 2147483647
#define ORC_SL_MIN (-1-ORC_SL_MAX)
#define ORC_UL_MAX 4294967295U
#define ORC_UL_MIN 0
#define ORC_CLAMP_SB(x) ORC_CLAMP(x,ORC_SB_MIN,ORC_SB_MAX)
#define ORC_CLAMP_UB(x) ORC_CLAMP(x,ORC_UB_MIN,ORC_UB_MAX)
#define ORC_CLAMP_SW(x) ORC_CLAMP(x,ORC_SW_MIN,ORC_SW_MAX)
#define ORC_CLAMP_UW(x) ORC_CLAMP(x,ORC_UW_MIN,ORC_UW_MAX)
#define ORC_CLAMP_SL(x) ORC_CLAMP(x,ORC_SL_MIN,ORC_SL_MAX)
#define ORC_CLAMP_UL(x) ORC_CLAMP(x,ORC_UL_MIN,ORC_UL_MAX)
#define ORC_SWAP_W(x) ((((x)&0xff)<<8) | (((x)&0xff00)>>8))
#define ORC_SWAP_L(x) ((((x)&0xff)<<24) | (((x)&0xff00)<<8) | (((x)&0xff0000)>>8) | (((x)&0xff000000)>>24))
#define ORC_SWAP_Q(x) ((((x)&ORC_UINT64_C(0xff))<<56) | (((x)&ORC_UINT64_C(0xff00))<<40) | (((x)&ORC_UINT64_C(0xff0000))<<24) | (((x)&ORC_UINT64_C(0xff000000))<<8) | (((x)&ORC_UINT64_C(0xff00000000))>>8) | (((x)&ORC_UINT64_C(0xff0000000000))>>24) | (((x)&ORC_UINT64_C(0xff000000000000))>>40) | (((x)&ORC_UINT64_C(0xff00000000000000))>>56))
#define ORC_PTR_OFFSET(ptr,offset) ((void *)(((unsigned char *)(ptr)) + (offset)))
#define ORC_DENORMAL(x) ((x) & ((((x)&0x7f800000) == 0) ? 0xff800000 : 0xffffffff))
#define ORC_ISNAN(x) ((((x)&0x7f800000) == 0x7f800000) && (((x)&0x007fffff) != 0))
#define ORC_DENORMAL_DOUBLE(x) ((x) & ((((x)&ORC_UINT64_C(0x7ff0000000000000)) == 0) ? ORC_UINT64_C(0xfff0000000000000) : ORC_UINT64_C(0xffffffffffffffff)))
#define ORC_ISNAN_DOUBLE(x) ((((x)&ORC_UINT64_C(0x7ff0000000000000)) == ORC_UINT64_C(0x7ff0000000000000)) && (((x)&ORC_UINT64_C(0x000fffffffffffff)) != 0))
#ifndef ORC_RESTRICT
#if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L
#define ORC_RESTRICT restrict
#elif defined(__GNUC__) && __GNUC__ >= 4
#define ORC_RESTRICT __restrict__
#else
#define ORC_RESTRICT
#endif
#endif
/* end Orc C target preamble */


/* convert_I420_AYUV */

/*
 * Plain C kernel shared by the DISABLE_ORC entry point and by the backup
 * function handed to Orc.
 *
 * For each of the m rows (row r of every array starts r * <stride> bytes
 * after its base pointer) and each of the n columns i, one 32-bit element
 * is written to d1 and one to d2.  In memory order the four bytes are:
 *
 *   byte 0: the constant 0xff
 *   byte 1: s1[i] for the d1 element, s2[i] for the d2 element
 *   byte 2: s3[i >> 1]
 *   byte 3: s4[i >> 1]
 *
 * Going by the function name these are presumably alpha, luma and the two
 * horizontally subsampled chroma planes, with d1/s1 and d2/s2 being two
 * rows that share one chroma row -- the code itself only shows the byte
 * shuffling described above.
 */
static void
convert_I420_AYUV_kernel (void *d1, int d1_stride, void *d2, int d2_stride,
    const void *s1, int s1_stride, const void *s2, int s2_stride,
    const void *s3, int s3_stride, const void *s4, int s4_stride,
    int n, int m)
{
  /* loadpb: the byte constant 0xff, narrowed into a signed 8-bit slot */
  const orc_int8 fill = (int)0x000000ff;
  int row;

  for (row = 0; row < m; row++) {
    orc_union32 * ORC_RESTRICT out_a = ORC_PTR_OFFSET(d1, d1_stride * row);
    orc_union32 * ORC_RESTRICT out_b = ORC_PTR_OFFSET(d2, d2_stride * row);
    const orc_int8 * ORC_RESTRICT in_a = ORC_PTR_OFFSET(s1, s1_stride * row);
    const orc_int8 * ORC_RESTRICT in_b = ORC_PTR_OFFSET(s2, s2_stride * row);
    const orc_int8 * ORC_RESTRICT in_c = ORC_PTR_OFFSET(s3, s3_stride * row);
    const orc_int8 * ORC_RESTRICT in_d = ORC_PTR_OFFSET(s4, s4_stride * row);
    int col;

    for (col = 0; col < n; col++) {
      orc_union32 px;

      /* loadupdb x2 + mergebw: each s3/s4 byte serves two adjacent columns */
      px.x4[2] = in_c[col >> 1];
      px.x4[3] = in_d[col >> 1];

      /* loadb + mergebw + mergewl + storel for the d1 row */
      px.x4[0] = fill;
      px.x4[1] = in_a[col];
      out_a[col] = px;

      /* same again for the d2 row; only byte 1 changes */
      px.x4[1] = in_b[col];
      out_b[col] = px;
    }
  }
}

#ifdef DISABLE_ORC
/*
 * Public entry point when Orc is compiled out: runs the C kernel directly
 * on the caller's arrays.  Strides are in bytes; n is the number of
 * columns and m the number of rows processed.
 */
void
convert_I420_AYUV (orc_uint32 * ORC_RESTRICT d1, int d1_stride,
    orc_uint32 * ORC_RESTRICT d2, int d2_stride,
    const orc_uint8 * ORC_RESTRICT s1, int s1_stride,
    const orc_uint8 * ORC_RESTRICT s2, int s2_stride,
    const orc_uint8 * ORC_RESTRICT s3, int s3_stride,
    const orc_uint8 * ORC_RESTRICT s4, int s4_stride, int n, int m)
{
  convert_I420_AYUV_kernel (d1, d1_stride, d2, d2_stride,
      s1, s1_stride, s2, s2_stride, s3, s3_stride, s4, s4_stride, n, m);
}

#else
/*
 * Backup implementation registered with the Orc program.  It unpacks the
 * executor (arrays/params slots 0, 1 and 4..7, column count ex->n, row
 * count ex->params[ORC_VAR_A1]) and runs the C kernel on it.
 */
static void
_backup_convert_I420_AYUV (OrcExecutor * ORC_RESTRICT ex)
{
  convert_I420_AYUV_kernel (
      ex->arrays[0], ex->params[0],
      ex->arrays[1], ex->params[1],
      ex->arrays[4], ex->params[4],
      ex->arrays[5], ex->params[5],
      ex->arrays[6], ex->params[6],
      ex->arrays[7], ex->params[7],
      ex->n, ex->params[ORC_VAR_A1]);
}

/*
 * Creates the (not yet compiled) OrcProgram for convert_I420_AYUV and
 * attaches the C backup function to it.  The active branch loads the
 * program from static bytecode; the disabled branch builds it through
 * individual API calls instead.
 */
static OrcProgram *
convert_I420_AYUV_new_program (void)
{
  OrcProgram *p;

#if 1
  static const orc_uint8 bc[] = {
    1, 7, 9, 17,
    /* "convert_I420_AYUV" in ASCII */
    99, 111, 110, 118, 101, 114, 116, 95, 73, 52, 50, 48, 95, 65, 89, 85, 86,
    11, 4, 4, 11, 4, 4,
    12, 1, 1, 12, 1, 1, 12, 1, 1, 12, 1, 1,
    14, 1, 255, 0, 0, 0,
    20, 2, 20, 2, 20, 1, 20, 1,
    45, 34, 6,
    45, 35, 7,
    196, 32, 34, 35,
    196, 33, 16, 4,
    195, 0, 33, 32,
    196, 33, 16, 5,
    195, 1, 33, 32,
    2, 0,
  };

  p = orc_program_new_from_static_bytecode (bc);
  orc_program_set_backup_function (p, _backup_convert_I420_AYUV);
#else
  p = orc_program_new ();
  orc_program_set_2d (p);
  orc_program_set_name (p, "convert_I420_AYUV");
  orc_program_set_backup_function (p, _backup_convert_I420_AYUV);
  orc_program_add_destination (p, 4, "d1");
  orc_program_add_destination (p, 4, "d2");
  orc_program_add_source (p, 1, "s1");
  orc_program_add_source (p, 1, "s2");
  orc_program_add_source (p, 1, "s3");
  orc_program_add_source (p, 1, "s4");
  orc_program_add_constant (p, 1, 0x000000ff, "c1");
  orc_program_add_temporary (p, 2, "t1");
  orc_program_add_temporary (p, 2, "t2");
  orc_program_add_temporary (p, 1, "t3");
  orc_program_add_temporary (p, 1, "t4");

  orc_program_append_2 (p, "loadupdb", 0, ORC_VAR_T3, ORC_VAR_S3,
      ORC_VAR_D1, ORC_VAR_D1);
  orc_program_append_2 (p, "loadupdb", 0, ORC_VAR_T4, ORC_VAR_S4,
      ORC_VAR_D1, ORC_VAR_D1);
  orc_program_append_2 (p, "mergebw", 0, ORC_VAR_T1, ORC_VAR_T3,
      ORC_VAR_T4, ORC_VAR_D1);
  orc_program_append_2 (p, "mergebw", 0, ORC_VAR_T2, ORC_VAR_C1,
      ORC_VAR_S1, ORC_VAR_D1);
  orc_program_append_2 (p, "mergewl", 0, ORC_VAR_D1, ORC_VAR_T2,
      ORC_VAR_T1, ORC_VAR_D1);
  orc_program_append_2 (p, "mergebw", 0, ORC_VAR_T2, ORC_VAR_C1,
      ORC_VAR_S2, ORC_VAR_D1);
  orc_program_append_2 (p, "mergewl", 0, ORC_VAR_D2, ORC_VAR_T2,
      ORC_VAR_T1, ORC_VAR_D1);
#endif

  return p;
}

/*
 * Public entry point when Orc is available.
 *
 * On the first call the program is created, compiled and its code object
 * cached in a function-local static; the p_inited flag is tested once
 * without the Orc "once" mutex and again after taking it.  Every call then
 * fills a stack OrcExecutor with the caller's arrays, byte strides and the
 * n x m extent, and invokes the cached code's exec function.
 */
void
convert_I420_AYUV (orc_uint32 * ORC_RESTRICT d1, int d1_stride,
    orc_uint32 * ORC_RESTRICT d2, int d2_stride,
    const orc_uint8 * ORC_RESTRICT s1, int s1_stride,
    const orc_uint8 * ORC_RESTRICT s2, int s2_stride,
    const orc_uint8 * ORC_RESTRICT s3, int s3_stride,
    const orc_uint8 * ORC_RESTRICT s4, int s4_stride, int n, int m)
{
  static volatile int p_inited = 0;
  static OrcCode *c = 0;
  OrcExecutor executor;
  OrcExecutor *ex = &executor;
  void (*run) (OrcExecutor *);

  if (!p_inited) {
    orc_once_mutex_lock ();
    if (!p_inited) {
      OrcProgram *p = convert_I420_AYUV_new_program ();

      orc_program_compile (p);
      c = orc_program_take_code (p);
      orc_program_free (p);
    }
    p_inited = TRUE;
    orc_once_mutex_unlock ();
  }

  /* executor bookkeeping: code object, no program, extent */
  ex->arrays[ORC_VAR_A2] = c;
  ex->program = 0;
  ex->n = n;
  ORC_EXECUTOR_M(ex) = m;

  /* destinations */
  ex->arrays[ORC_VAR_D1] = d1;
  ex->params[ORC_VAR_D1] = d1_stride;
  ex->arrays[ORC_VAR_D2] = d2;
  ex->params[ORC_VAR_D2] = d2_stride;

  /* sources (const is cast away because the executor stores void *) */
  ex->arrays[ORC_VAR_S1] = (void *)s1;
  ex->params[ORC_VAR_S1] = s1_stride;
  ex->arrays[ORC_VAR_S2] = (void *)s2;
  ex->params[ORC_VAR_S2] = s2_stride;
  ex->arrays[ORC_VAR_S3] = (void *)s3;
  ex->params[ORC_VAR_S3] = s3_stride;
  ex->arrays[ORC_VAR_S4] = (void *)s4;
  ex->params[ORC_VAR_S4] = s4_stride;

  run = c->exec;
  run (ex);
}
#endif