/** * MojoShader; generate shader programs from bytecode of compiled * Direct3D shaders. * * Please see the file LICENSE.txt in the source's root directory. * * This file written by Ryan C. Gordon. */ // !!! FIXME: I keep changing coding styles for symbols and typedefs. // !!! FIXME: do DEF* and DCL_* opcodes have to come before instructions? // !!! FIXME: my reading of the msdn spec suggests no. // Shader bytecode format is described at MSDN: // http://msdn2.microsoft.com/en-us/library/ms800307.aspx #include #include #include #include #include #include #include "mojoshader.h" // This is the highest shader version we currently support. #define MAX_SHADER_MAJOR 3 #define MAX_SHADER_MINOR 0 // You get all the profiles unless you go out of your way to disable them. #ifndef SUPPORT_PROFILE_D3D #define SUPPORT_PROFILE_D3D 1 #endif #ifndef SUPPORT_PROFILE_GLSL #define SUPPORT_PROFILE_GLSL 1 #endif // Get basic wankery out of the way here... typedef unsigned int uint; // this is a printf() helper. don't use for code. typedef uint8_t uint8; typedef uint32_t uint32; typedef int32_t int32; #ifdef __GNUC__ #define ISPRINTF(x,y) __attribute__((format (printf, x, y))) #else #define ISPRINTF(x,y) #endif #define STATICARRAYLEN(x) ( (sizeof ((x))) / (sizeof ((x)[0])) ) // Byteswap magic... #if ((defined __GNUC__) && (defined __POWERPC__)) static inline uint32 SWAP32(uint32 x) { __asm__ __volatile__("lwbrx %0,0,%1" : "=r" (x) : "r" (&x)); return x; } // SWAP32 #elif defined(__POWERPC__) static inline uint32 SWAP32(uint32 x) { return ( (((x) >> 24) & 0x000000FF) | (((x) >> 8) & 0x0000FF00) | (((x) << 8) & 0x00FF0000) | (((x) << 24) & 0xFF000000) ); } // SWAP32 #else # define SWAP32(x) (x) #endif // Shader model version magic. static inline uint32 ver_ui32(const uint8 major, const uint8 minor) { return ( (((uint32) major) << 16) | (((minor) == 0xFF) ? 0 : (minor)) ); } // version_ui32 #define SHADER_VERSION_SUPPORTED(maj, min) \ (ver_ui32(maj, min) <= ver_ui32(MAX_SHADER_MAJOR, MAX_SHADER_MINOR)) // predeclare. typedef struct Context Context; // one emit function for each opcode in each profile. typedef void (*emit_function)(Context *ctx); // one emit function for comments in each profile. typedef void (*emit_comment)(Context *ctx, const char *str); // one emit function for starting output in each profile. typedef void (*emit_start)(Context *ctx); // one emit function for ending output in each profile. typedef void (*emit_end)(Context *ctx); // one args function for each possible sequence of opcode arguments. typedef int (*args_function)(Context *ctx); // one state function for each opcode where we have state machine updates. typedef int (*state_function)(Context *ctx); typedef struct { const char *name; emit_start start_emitter; emit_end end_emitter; emit_comment comment_emitter; } Profile; typedef enum { SHADER_TYPE_UNKNOWN = -1, SHADER_TYPE_PIXEL, SHADER_TYPE_VERTEX, SHADER_TYPE_TOTAL } ShaderType; typedef enum { REGISTER_TYPE_TEMP = 0, REGISTER_TYPE_INPUT = 1, REGISTER_TYPE_CONST = 2, REGISTER_TYPE_ADDR = 3, REGISTER_TYPE_TEXTURE = 3, // ALSO 3! REGISTER_TYPE_RASTOUT = 4, REGISTER_TYPE_ATTROUT = 5, REGISTER_TYPE_TEXCRDOUT = 6, REGISTER_TYPE_OUTPUT = 6, // ALSO 6! REGISTER_TYPE_CONSTINT = 7, REGISTER_TYPE_COLOROUT = 8, REGISTER_TYPE_DEPTHOUT = 9, REGISTER_TYPE_SAMPLER = 10, REGISTER_TYPE_CONST2 = 11, REGISTER_TYPE_CONST3 = 12, REGISTER_TYPE_CONST4 = 13, REGISTER_TYPE_CONSTBOOL = 14, REGISTER_TYPE_LOOP = 15, REGISTER_TYPE_TEMPFLOAT16 = 16, REGISTER_TYPE_MISCTYPE = 17, REGISTER_TYPE_LABEL = 18, REGISTER_TYPE_PREDICATE = 19, REGISTER_TYPE_MAX = 19 } RegisterType; typedef enum { RASTOUT_TYPE_POSITION = 0, RASTOUT_TYPE_FOG = 1, RASTOUT_TYPE_POINT_SIZE = 2, RASTOUT_TYPE_MAX = 2 } RastOutType; typedef enum { MISCTYPE_TYPE_POSITION = 0, MISCTYPE_TYPE_FACE = 1, MISCTYPE_TYPE_MAX = 1 } MiscTypeType; typedef enum { DECLUSAGE_POSITION = 0, DECLUSAGE_BLENDWEIGHT = 1, DECLUSAGE_BLENDINDICES = 2, DECLUSAGE_NORMAL = 3, DECLUSAGE_PSIZE = 4, DECLUSAGE_TEXCOORD = 5, DECLUSAGE_TANGENT = 6, DECLUSAGE_BINORMAL = 7, DECLUSAGE_TESSFACTOR = 8, DECLUSAGE_POSITIONT = 9, DECLUSAGE_COLOR = 10, DECLUSAGE_FOG = 11, DECLUSAGE_DEPTH = 12, DECLUSAGE_SAMPLE = 13 } DeclUsageType; typedef enum { TEXTURE_TYPE_2D = 2, TEXTURE_TYPE_CUBE = 3, TEXTURE_TYPE_VOLUME = 4, } TextureType; // A simple linked list of strings, so we can build the final output without // realloc()ing for each new line, and easily insert lines into the middle // of the output without much trouble. typedef struct OutputList { char *str; struct OutputList *next; } OutputList; // result modifiers. #define MOD_SATURATE 0x01 #define MOD_PP 0x02 #define MOD_CENTROID 0x04 // source modifiers. typedef enum { SRCMOD_NONE, SRCMOD_NEGATE, SRCMOD_BIAS, SRCMOD_BIASNEGATE, SRCMOD_SIGN, SRCMOD_SIGNNEGATE, SRCMOD_COMPLEMENT, SRCMOD_X2, SRCMOD_X2NEGATE, SRCMOD_DZ, SRCMOD_DW, SRCMOD_ABS, SRCMOD_ABSNEGATE, SRCMOD_NOT, SRCMOD_TOTAL } SourceMod; typedef struct { const uint32 *token; // this is the unmolested token in the stream. int regnum; int relative; int writemask; // xyzw or rgba (all four, not split out). int writemask0; // x or red int writemask1; // y or green int writemask2; // z or blue int writemask3; // w or alpha int result_mod; int result_shift; int regtype; } DestArgInfo; typedef struct { const uint32 *token; // this is the unmolested token in the stream. int regnum; int relative; int swizzle; // xyzw (all four, not split out). int swizzle_x; int swizzle_y; int swizzle_z; int swizzle_w; int src_mod; int regtype; } SourceArgInfo; #define SCRATCH_BUFFER_SIZE 256 #define SCRATCH_BUFFERS 10 // Context...this is state that changes as we parse through a shader... struct Context { MOJOSHADER_malloc malloc; MOJOSHADER_free free; const uint32 *tokens; uint32 tokencount; OutputList output; OutputList *output_tail; int output_len; // total strlen; prevents walking the list just to malloc. const char *endline; int endline_len; const char *failstr; char scratch[SCRATCH_BUFFERS][SCRATCH_BUFFER_SIZE]; int scratchidx; // current scratch buffer. int profileid; const Profile *profile; ShaderType shader_type; uint32 major_ver; uint32 minor_ver; DestArgInfo dest_args[1]; SourceArgInfo source_args[4]; uint32 dwords[4]; uint32 instruction_count; uint32 instruction_controls; }; static inline char *get_scratch_buffer(Context *ctx) { ctx->scratchidx = (ctx->scratchidx + 1) % SCRATCH_BUFFERS; return ctx->scratch[ctx->scratchidx]; } // get_scratch_buffer // Special-case return values from the parsing pipeline... #define FAIL (-1) #define END_OF_STREAM (-2) static const char *out_of_mem_string = "Out of memory"; static inline int out_of_memory(Context *ctx) { if (ctx->failstr == NULL) ctx->failstr = out_of_mem_string; // fail() would call malloc(). return FAIL; } // out_of_memory static int failf(Context *ctx, const char *fmt, ...) ISPRINTF(2,3); static int failf(Context *ctx, const char *fmt, ...) { if (ctx->failstr == NULL) // don't change existing error. { char *scratch = get_scratch_buffer(ctx); va_list ap; va_start(ap, fmt); const int len = vsnprintf(scratch,SCRATCH_BUFFER_SIZE,fmt,ap); va_end(ap); char *failstr = (char *) ctx->malloc(len + 1); if (failstr == NULL) out_of_memory(ctx); else { // see comments about scratch buffer overflow in output_line(). if (len < SCRATCH_BUFFER_SIZE) strcpy(failstr, scratch); // copy it over. else { va_start(ap, fmt); vsnprintf(failstr, len + 1, fmt, ap); // rebuild it. va_end(ap); } // else ctx->failstr = failstr; } // else } // if return FAIL; } // failf static inline int fail(Context *ctx, const char *reason) { return failf(ctx, "%s", reason); } // fail static int output_line(Context *ctx, const char *fmt, ...) ISPRINTF(2,3); static int output_line(Context *ctx, const char *fmt, ...) { if (ctx->failstr != NULL) return FAIL; // we failed previously, don't go on... OutputList *item = (OutputList *) ctx->malloc(sizeof (OutputList)); if (item == NULL) return out_of_memory(ctx); char *scratch = get_scratch_buffer(ctx); va_list ap; va_start(ap, fmt); const int len = vsnprintf(scratch, SCRATCH_BUFFER_SIZE, fmt, ap); va_end(ap); item->str = (char *) ctx->malloc(len + 1); if (item->str == NULL) { free(item); return out_of_memory(ctx); } // if // If we overflowed our scratch buffer, that's okay. We were going to // allocate anyhow...the scratch buffer just lets us avoid a second // run of vsnprintf(). if (len < SCRATCH_BUFFER_SIZE) strcpy(item->str, scratch); // copy it over. else { va_start(ap, fmt); vsnprintf(item->str, len + 1, fmt, ap); // rebuild it. va_end(ap); } // else item->next = NULL; ctx->output_tail->next = item; ctx->output_tail = item; ctx->output_len += len + ctx->endline_len; return 0; } // output_line // if SUPPORT_PROFILE_* isn't defined, we assume an implicit desire to support. #define AT_LEAST_ONE_PROFILE 0 #if !SUPPORT_PROFILE_D3D #define PROFILE_EMITTER_D3D(op) #else #undef AT_LEAST_ONE_PROFILE #define AT_LEAST_ONE_PROFILE 1 #define PROFILE_EMITTER_D3D(op) emit_D3D_##op, static const char *get_D3D_register_string(Context *ctx, RegisterType regtype, int regnum, char *regnum_str, size_t regnum_size) { const char *retval = NULL; int has_number = 1; switch (regtype) { case REGISTER_TYPE_TEMP: retval = "r"; break; case REGISTER_TYPE_INPUT: retval = "v"; break; case REGISTER_TYPE_CONST: retval = "c"; break; case REGISTER_TYPE_CONST2: retval = "c"; regnum += 2048; break; case REGISTER_TYPE_CONST3: retval = "c"; regnum += 4096; break; case REGISTER_TYPE_CONST4: retval = "c"; regnum += 6144; break; case REGISTER_TYPE_ADDR: // (or REGISTER_TYPE_TEXTURE, same value.) retval = (ctx->shader_type == SHADER_TYPE_VERTEX) ? "a" : "t"; break; case REGISTER_TYPE_RASTOUT: switch ((RastOutType) regnum) { case RASTOUT_TYPE_POSITION: retval = "oPos"; break; case RASTOUT_TYPE_FOG: retval = "oFog"; break; case RASTOUT_TYPE_POINT_SIZE: retval = "oPts"; break; } // switch has_number = 0; break; case REGISTER_TYPE_ATTROUT: retval = "oD"; break; case REGISTER_TYPE_TEXCRDOUT: // (or REGISTER_TYPE_OUTPUT, same value.) if ((ctx->shader_type==SHADER_TYPE_VERTEX) && (ctx->major_ver>=3)) retval = "o"; else retval = "oT"; break; case REGISTER_TYPE_CONSTINT: retval = "i"; break; case REGISTER_TYPE_COLOROUT: retval = "oC"; break; case REGISTER_TYPE_DEPTHOUT: retval = "oDepth"; has_number = 0; break; case REGISTER_TYPE_SAMPLER: retval = "s"; break; case REGISTER_TYPE_CONSTBOOL: retval = "b"; break; case REGISTER_TYPE_LOOP: retval = "aL"; has_number = 0; break; // !!! FIXME: don't know what the asm string is for this.. // case REGISTER_TYPE_TEMPFLOAT16: case REGISTER_TYPE_MISCTYPE: switch ((MiscTypeType) regnum) { case MISCTYPE_TYPE_POSITION: retval = "vPos"; break; case MISCTYPE_TYPE_FACE: retval = "vFace"; break; } // switch has_number = 0; break; case REGISTER_TYPE_LABEL: retval = "l"; break; case REGISTER_TYPE_PREDICATE: retval = "p"; break; } // switch if (has_number) snprintf(regnum_str, regnum_size, "%u", (uint) regnum); else regnum_str[0] = '\0'; return retval; } // get_D3D_register_string static char *make_D3D_destarg_string(Context *ctx, const int idx) { if (idx >= STATICARRAYLEN(ctx->dest_args)) { fail(ctx, "Too many destination args"); return ""; } // if const DestArgInfo *arg = &ctx->dest_args[idx]; const char *result_shift_str = ""; switch (arg->result_shift) { case 0x1: result_shift_str = "_x2"; break; case 0x2: result_shift_str = "_x4"; break; case 0x3: result_shift_str = "_x8"; break; case 0xD: result_shift_str = "_d8"; break; case 0xE: result_shift_str = "_d4"; break; case 0xF: result_shift_str = "_d2"; break; } // switch const char *sat_str = (arg->result_mod & MOD_SATURATE) ? "_sat" : ""; const char *pp_str = (arg->result_mod & MOD_PP) ? "_pp" : ""; const char *cent_str = (arg->result_mod & MOD_CENTROID) ? "_centroid" : ""; char regnum_str[16]; const char *regtype_str = get_D3D_register_string(ctx, (RegisterType) arg->regtype, arg->regnum, regnum_str, sizeof (regnum_str)); if (regtype_str == NULL) { fail(ctx, "Unknown destination register type."); return ""; } // if char writemask_str[6]; int i = 0; if (arg->writemask != 0xF) // 0xF == 1111. No explicit mask. { writemask_str[i++] = '.'; if (arg->writemask0) writemask_str[i++] = 'x'; if (arg->writemask1) writemask_str[i++] = 'y'; if (arg->writemask2) writemask_str[i++] = 'z'; if (arg->writemask3) writemask_str[i++] = 'w'; } // if writemask_str[i] = '\0'; assert(i < sizeof (writemask_str)); // may turn out something like "_x2_sat_pp_centroid r0.xyzw" ... char *retval = get_scratch_buffer(ctx); snprintf(retval, SCRATCH_BUFFER_SIZE, "%s%s%s%s %s%s%s", result_shift_str, sat_str, pp_str, cent_str, regtype_str, regnum_str, writemask_str); return retval; } // make_D3D_destarg_string static char *make_D3D_sourcearg_string(Context *ctx, const int idx) { if (idx >= STATICARRAYLEN(ctx->source_args)) { fail(ctx, "Too many source args"); return ""; } // if const SourceArgInfo *arg = &ctx->source_args[idx]; const char *premod_str = ""; const char *postmod_str = ""; switch ((SourceMod) arg->src_mod) { case SRCMOD_NEGATE: premod_str = "-"; break; case SRCMOD_BIASNEGATE: premod_str = "-"; // fall through. case SRCMOD_BIAS: postmod_str = "_bias"; break; case SRCMOD_SIGNNEGATE: premod_str = "-"; // fall through. case SRCMOD_SIGN: postmod_str = "_bx2"; break; case SRCMOD_COMPLEMENT: premod_str = "1-"; break; case SRCMOD_X2NEGATE: premod_str = "-"; // fall through. case SRCMOD_X2: postmod_str = "_x2"; break; case SRCMOD_DZ: postmod_str = "_dz"; break; case SRCMOD_DW: postmod_str = "_dw"; break; case SRCMOD_ABSNEGATE: premod_str = "-"; // fall through. case SRCMOD_ABS: postmod_str = "_abs"; break; case SRCMOD_NOT: premod_str = "!"; break; } // switch char regnum_str[16]; const char *regtype_str = get_D3D_register_string(ctx, (RegisterType) arg->regtype, arg->regnum, regnum_str, sizeof (regnum_str)); if (regtype_str == NULL) { fail(ctx, "Unknown source register type."); return ""; } // if char swizzle_str[6]; int i = 0; if (arg->swizzle != 0xE4) // 0xE4 == 11100100 ... 3 2 1 0. No swizzle. { static const char channel[] = { 'x', 'y', 'z', 'w' }; swizzle_str[i++] = '.'; swizzle_str[i++] = channel[arg->swizzle_x]; swizzle_str[i++] = channel[arg->swizzle_y]; swizzle_str[i++] = channel[arg->swizzle_z]; swizzle_str[i++] = channel[arg->swizzle_w]; // .xyzz is the same as .xyz, .z is the same as .zzzz, etc. while (swizzle_str[i-1] == swizzle_str[i-2]) i--; } // if swizzle_str[i] = '\0'; assert(i < sizeof (swizzle_str)); char *retval = get_scratch_buffer(ctx); snprintf(retval, SCRATCH_BUFFER_SIZE, "%s%s%s%s", premod_str, regtype_str, postmod_str, swizzle_str); return retval; } // make_D3D_sourcearg_string static void emit_D3D_start(Context *ctx) { const uint major = (uint) ctx->major_ver; const uint minor = (uint) ctx->minor_ver; const char *shadertype_str = NULL; char minor_str[16]; if (minor == 0xFF) strcpy(minor_str, "sw"); else if (minor == 0x1) // apparently this is "vs_2_x". Weird. strcpy(minor_str, "x"); else snprintf(minor_str, sizeof (minor_str), "%u", (uint) minor); if (ctx->shader_type == SHADER_TYPE_PIXEL) shadertype_str = "ps"; else if (ctx->shader_type == SHADER_TYPE_VERTEX) shadertype_str = "vs"; else { failf(ctx, "Shader type %u unsupported in this profile.", (uint) ctx->shader_type); return; } // else output_line(ctx, "%s_%u_%s", shadertype_str, major, minor_str); } // emit_D3D_start static void emit_D3D_end(Context *ctx) { output_line(ctx, "end"); } // emit_D3D_end static void emit_D3D_comment(Context *ctx, const char *str) { output_line(ctx, "; %s", str); } // emit_D3D_comment static void emit_D3D_RESERVED(Context *ctx) { // do nothing; fails in the state machine. } // emit_D3D_RESERVED // Generic D3D opcode emitters. A list of macros generate all the entry points // that call into these... static char *lowercase(char *dst, const char *src) { int i = 0; do { const char ch = src[i]; dst[i] = (((ch >= 'A') && (ch <= 'Z')) ? (ch - ('A' - 'a')) : ch); } while (src[i++]); return dst; } // lowercase static void emit_D3D_opcode_d(Context *ctx, const char *opcode) { const char *dst0 = make_D3D_destarg_string(ctx, 0); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s%s", opcode, dst0); } // emit_D3D_opcode_d static void emit_D3D_opcode_s(Context *ctx, const char *opcode) { const char *src0 = make_D3D_destarg_string(ctx, 0); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s %s", opcode, src0); } // emit_D3D_opcode_s static void emit_D3D_opcode_ss(Context *ctx, const char *opcode) { const char *src0 = make_D3D_sourcearg_string(ctx, 0); const char *src1 = make_D3D_sourcearg_string(ctx, 1); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s %s, %s", opcode, src0, src1); } // emit_D3D_opcode_s static void emit_D3D_opcode_ds(Context *ctx, const char *opcode) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const char *src0 = make_D3D_sourcearg_string(ctx, 0); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s%s, %s", opcode, dst0, src0); } // emit_D3D_opcode_ds static void emit_D3D_opcode_dss(Context *ctx, const char *opcode) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const char *src0 = make_D3D_sourcearg_string(ctx, 0); const char *src1 = make_D3D_sourcearg_string(ctx, 1); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s%s, %s, %s", opcode, dst0, src0, src1); } // emit_D3D_opcode_dss static void emit_D3D_opcode_dsss(Context *ctx, const char *opcode) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const char *src0 = make_D3D_sourcearg_string(ctx, 0); const char *src1 = make_D3D_sourcearg_string(ctx, 1); const char *src2 = make_D3D_sourcearg_string(ctx, 2); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s%s, %s, %s, %s", opcode, dst0, src0, src1, src2); } // emit_D3D_opcode_dsss static void emit_D3D_opcode_dssss(Context *ctx, const char *opcode) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const char *src0 = make_D3D_sourcearg_string(ctx, 0); const char *src1 = make_D3D_sourcearg_string(ctx, 1); const char *src2 = make_D3D_sourcearg_string(ctx, 2); const char *src3 = make_D3D_sourcearg_string(ctx, 3); opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx,"%s%s, %s, %s, %s, %s",opcode,dst0,src0,src1,src2,src3); } // emit_D3D_opcode_dssss static void emit_D3D_opcode(Context *ctx, const char *opcode) { opcode = lowercase(get_scratch_buffer(ctx), opcode); output_line(ctx, "%s", opcode); } // emit_D3D_opcode_dssss #define EMIT_D3D_OPCODE_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode(ctx, #op); \ } #define EMIT_D3D_OPCODE_D_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_d(ctx, #op); \ } #define EMIT_D3D_OPCODE_S_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_s(ctx, #op); \ } #define EMIT_D3D_OPCODE_SS_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_ss(ctx, #op); \ } #define EMIT_D3D_OPCODE_DS_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_ds(ctx, #op); \ } #define EMIT_D3D_OPCODE_DSS_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_dss(ctx, #op); \ } #define EMIT_D3D_OPCODE_DSSS_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_dsss(ctx, #op); \ } #define EMIT_D3D_OPCODE_DSSSS_FUNC(op) \ static void emit_D3D_##op(Context *ctx) { \ emit_D3D_opcode_dssss(ctx, #op); \ } EMIT_D3D_OPCODE_FUNC(NOP) EMIT_D3D_OPCODE_DS_FUNC(MOV) EMIT_D3D_OPCODE_DSS_FUNC(ADD) EMIT_D3D_OPCODE_DSS_FUNC(SUB) EMIT_D3D_OPCODE_DSSS_FUNC(MAD) EMIT_D3D_OPCODE_DSS_FUNC(MUL) EMIT_D3D_OPCODE_DS_FUNC(RCP) EMIT_D3D_OPCODE_DS_FUNC(RSQ) EMIT_D3D_OPCODE_DSS_FUNC(DP3) EMIT_D3D_OPCODE_DSS_FUNC(DP4) EMIT_D3D_OPCODE_DSS_FUNC(MIN) EMIT_D3D_OPCODE_DSS_FUNC(MAX) EMIT_D3D_OPCODE_DSS_FUNC(SLT) EMIT_D3D_OPCODE_DSS_FUNC(SGE) EMIT_D3D_OPCODE_DS_FUNC(EXP) EMIT_D3D_OPCODE_DS_FUNC(LOG) EMIT_D3D_OPCODE_DS_FUNC(LIT) EMIT_D3D_OPCODE_DSS_FUNC(DST) EMIT_D3D_OPCODE_DSSS_FUNC(LRP) EMIT_D3D_OPCODE_DS_FUNC(FRC) EMIT_D3D_OPCODE_DSS_FUNC(M4X4) EMIT_D3D_OPCODE_DSS_FUNC(M4X3) EMIT_D3D_OPCODE_DSS_FUNC(M3X4) EMIT_D3D_OPCODE_DSS_FUNC(M3X3) EMIT_D3D_OPCODE_DSS_FUNC(M3X2) EMIT_D3D_OPCODE_S_FUNC(CALL) EMIT_D3D_OPCODE_SS_FUNC(CALLNZ) EMIT_D3D_OPCODE_SS_FUNC(LOOP) EMIT_D3D_OPCODE_FUNC(RET) EMIT_D3D_OPCODE_FUNC(ENDLOOP) EMIT_D3D_OPCODE_S_FUNC(LABEL) EMIT_D3D_OPCODE_DSS_FUNC(POW) EMIT_D3D_OPCODE_DSS_FUNC(CRS) EMIT_D3D_OPCODE_DSSS_FUNC(SGN) EMIT_D3D_OPCODE_DS_FUNC(ABS) EMIT_D3D_OPCODE_DS_FUNC(NRM) EMIT_D3D_OPCODE_DS_FUNC(SINCOS) EMIT_D3D_OPCODE_S_FUNC(REP) EMIT_D3D_OPCODE_FUNC(ENDREP) EMIT_D3D_OPCODE_S_FUNC(IF) EMIT_D3D_OPCODE_FUNC(ELSE) EMIT_D3D_OPCODE_FUNC(ENDIF) EMIT_D3D_OPCODE_FUNC(BREAK) EMIT_D3D_OPCODE_DS_FUNC(MOVA) EMIT_D3D_OPCODE_FUNC(TEXCOORD) // !!! FIXME! EMIT_D3D_OPCODE_D_FUNC(TEXKILL) EMIT_D3D_OPCODE_FUNC(TEX) // !!! FIXME! EMIT_D3D_OPCODE_DS_FUNC(TEXBEM) EMIT_D3D_OPCODE_DS_FUNC(TEXBEML) EMIT_D3D_OPCODE_DS_FUNC(TEXREG2AR) EMIT_D3D_OPCODE_DS_FUNC(TEXREG2GB) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X2PAD) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X2TEX) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X3PAD) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X3TEX) EMIT_D3D_OPCODE_DSS_FUNC(TEXM3X3SPEC) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X3VSPEC) EMIT_D3D_OPCODE_DS_FUNC(EXPP) EMIT_D3D_OPCODE_DS_FUNC(LOGP) EMIT_D3D_OPCODE_DSSS_FUNC(CND) EMIT_D3D_OPCODE_DS_FUNC(TEXREG2RGB) EMIT_D3D_OPCODE_DS_FUNC(TEXDP3TEX) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X2DEPTH) EMIT_D3D_OPCODE_DS_FUNC(TEXDP3) EMIT_D3D_OPCODE_DS_FUNC(TEXM3X3) EMIT_D3D_OPCODE_D_FUNC(TEXDEPTH) EMIT_D3D_OPCODE_DSSS_FUNC(CMP) EMIT_D3D_OPCODE_DSS_FUNC(BEM) EMIT_D3D_OPCODE_DSSS_FUNC(DP2ADD) EMIT_D3D_OPCODE_DS_FUNC(DSX) EMIT_D3D_OPCODE_DS_FUNC(DSY) EMIT_D3D_OPCODE_DSSSS_FUNC(TEXLDD) EMIT_D3D_OPCODE_DSS_FUNC(TEXLDL) EMIT_D3D_OPCODE_S_FUNC(BREAKP) // special cases for comparison opcodes... static const char *get_D3D_comparison_string(Context *ctx) { static const char *comps[] = { "", "_gt", "_eq", "_ge", "_lt", "_ne", "_le" }; if (ctx->instruction_controls >= STATICARRAYLEN(comps)) { fail(ctx, "unknown comparison control"); return ""; } // if return comps[ctx->instruction_controls]; } // get_D3D_comparison_string static void emit_D3D_BREAKC(Context *ctx) { char op[16]; snprintf(op, sizeof (op), "break%s", get_D3D_comparison_string(ctx)); emit_D3D_opcode_ss(ctx, op); } // emit_D3D_BREAKC static void emit_D3D_IFC(Context *ctx) { char op[16]; snprintf(op, sizeof (op), "if%s", get_D3D_comparison_string(ctx)); emit_D3D_opcode_ss(ctx, op); } // emit_D3D_IFC static void emit_D3D_SETP(Context *ctx) { char op[16]; snprintf(op, sizeof (op), "setp%s", get_D3D_comparison_string(ctx)); emit_D3D_opcode_dss(ctx, op); } // emit_D3D_SETP // !!! FIXME: this is sort of nasty. static void floatstr(Context *ctx, char *buf, size_t bufsize, float f) { const size_t len = snprintf(buf, bufsize, "%f", f); if (len >= bufsize) fail(ctx, "BUG: internal buffer is too small"); else { char *end = buf + len; char *ptr = strchr(buf, '.'); if (ptr == NULL) return; // done. while (--end != ptr) { if (*end != '0') { end++; break; } // if } // while *end = '\0'; // chop extra '0' or all decimal places off. } // else } // floatstr static void emit_D3D_DEF(Context *ctx) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const float *val = (const float *) ctx->dwords; // !!! FIXME: could be int? char val0[32]; char val1[32]; char val2[32]; char val3[32]; floatstr(ctx, val0, sizeof (val0), val[0]); floatstr(ctx, val1, sizeof (val1), val[1]); floatstr(ctx, val2, sizeof (val2), val[2]); floatstr(ctx, val3, sizeof (val3), val[3]); output_line(ctx, "def%s, %s, %s, %s, %s", dst0, val0, val1, val2, val3); } // emit_D3D_DEF static void emit_D3D_DEFI(Context *ctx) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const int32 *x = (const int32 *) ctx->dwords; output_line(ctx, "defi%s, %d, %d, %d, %d", dst0, (int) x[0], (int) x[1], (int) x[2], (int) x[3]); } // emit_D3D_DEFI static void emit_D3D_DEFB(Context *ctx) { const char *dst0 = make_D3D_destarg_string(ctx, 0); output_line(ctx, "defb%s, %s", dst0, ctx->dwords[0] ? "true" : "false"); } // emit_D3D_DEFB static void emit_D3D_DCL(Context *ctx) { const char *dst0 = make_D3D_destarg_string(ctx, 0); const DestArgInfo *arg = &ctx->dest_args[0]; const char *usage_str = ""; char index_str[16] = { '\0' }; if (ctx->shader_type == SHADER_TYPE_VERTEX) { static const char *usagestrs[] = { "_position", "_blendweight", "_blendindices", "_normal", "_psize", "_texcoord", "_tangent", "_binormal", "_tessfactor", "_positiont", "_color", "_fog", "_depth", "_sample" }; const uint32 usage = ctx->dwords[0]; const uint32 index = ctx->dwords[1]; if (usage >= STATICARRAYLEN(usagestrs)) { fail(ctx, "unknown DCL usage"); return; } // if usage_str = usagestrs[usage]; if (index != 0) snprintf(index_str, sizeof (index_str), "%u", (uint) index); } // if else if (arg->regtype == REGISTER_TYPE_SAMPLER) { switch ((const TextureType) ctx->dwords[0]) { case TEXTURE_TYPE_2D: usage_str = "_2d"; break; case TEXTURE_TYPE_CUBE: usage_str = "_cube"; break; case TEXTURE_TYPE_VOLUME: usage_str = "_volume"; break; default: fail(ctx, "unknown sampler texture type"); return; } // switch } // else if output_line(ctx, "dcl%s%s%s", usage_str, index_str, dst0); } // emit_D3D_DCL #undef EMIT_D3D_OPCODE_FUNC #undef EMIT_D3D_OPCODE_D_FUNC #undef EMIT_D3D_OPCODE_S_FUNC #undef EMIT_D3D_OPCODE_SS_FUNC #undef EMIT_D3D_OPCODE_DS_FUNC #undef EMIT_D3D_OPCODE_DSS_FUNC #undef EMIT_D3D_OPCODE_DSSS_FUNC #undef EMIT_D3D_OPCODE_DSSSS_FUNC #endif // SUPPORT_PROFILE_D3D #if !SUPPORT_PROFILE_GLSL #define PROFILE_EMITTER_GLSL(op) #else #undef AT_LEAST_ONE_PROFILE #define AT_LEAST_ONE_PROFILE 1 #define PROFILE_EMITTER_GLSL(op) emit_GLSL_##op, static void emit_GLSL_start(Context *ctx) { const uint major = (uint) ctx->major_ver; const uint minor = (uint) ctx->minor_ver; if (ctx->shader_type == SHADER_TYPE_PIXEL) output_line(ctx, "// Pixel shader, version %u.%u", major, minor); else if (ctx->shader_type == SHADER_TYPE_VERTEX) output_line(ctx, "// Vertex shader, version %u.%u", major, minor); else { failf(ctx, "Shader type %u unsupported in this profile.", (uint) ctx->shader_type); } // else output_line(ctx, "void main() {"); } // emit_GLSL_start static void emit_GLSL_end(Context *ctx) { output_line(ctx, "}"); } // emit_GLSL_end static void emit_GLSL_comment(Context *ctx, const char *str) { output_line(ctx, "// %s", str); } // emit_GLSL_comment static void emit_GLSL_NOP(Context *ctx) { // no-op is a no-op. :) } // emit_GLSL_NOP static void emit_GLSL_MOV(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MOV static void emit_GLSL_ADD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ADD static void emit_GLSL_SUB(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SUB static void emit_GLSL_MAD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MAD static void emit_GLSL_MUL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MUL static void emit_GLSL_RCP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_RCP static void emit_GLSL_RSQ(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_RSQ static void emit_GLSL_DP3(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DP3 static void emit_GLSL_DP4(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DP4 static void emit_GLSL_MIN(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MIN static void emit_GLSL_MAX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MAX static void emit_GLSL_SLT(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SLT static void emit_GLSL_SGE(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SGE static void emit_GLSL_EXP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_EXP static void emit_GLSL_LOG(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LOG static void emit_GLSL_LIT(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LIT static void emit_GLSL_DST(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DST static void emit_GLSL_LRP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LRP static void emit_GLSL_FRC(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_FRC static void emit_GLSL_M4X4(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_M4X4 static void emit_GLSL_M4X3(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_M4X3 static void emit_GLSL_M3X4(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_M3X4 static void emit_GLSL_M3X3(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_M3X3 static void emit_GLSL_M3X2(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_M3X2 static void emit_GLSL_CALL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_CALL static void emit_GLSL_CALLNZ(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_CALLNZ static void emit_GLSL_LOOP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LOOP static void emit_GLSL_RET(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_RET static void emit_GLSL_ENDLOOP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ENDLOOP static void emit_GLSL_LABEL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LABEL static void emit_GLSL_DCL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DCL static void emit_GLSL_POW(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_POW static void emit_GLSL_CRS(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_CRS static void emit_GLSL_SGN(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SGN static void emit_GLSL_ABS(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ABS static void emit_GLSL_NRM(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_NRM static void emit_GLSL_SINCOS(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SINCOS static void emit_GLSL_REP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_REP static void emit_GLSL_ENDREP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ENDREP static void emit_GLSL_IF(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_IF static void emit_GLSL_IFC(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_IFC static void emit_GLSL_ELSE(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ELSE static void emit_GLSL_ENDIF(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_ENDIF static void emit_GLSL_BREAK(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_BREAK static void emit_GLSL_BREAKC(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_BREAKC static void emit_GLSL_MOVA(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_MOVA static void emit_GLSL_DEFB(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DEFB static void emit_GLSL_DEFI(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DEFI static void emit_GLSL_TEXCOORD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXCOORD static void emit_GLSL_TEXKILL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXKILL static void emit_GLSL_TEX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEX static void emit_GLSL_TEXBEM(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXBEM static void emit_GLSL_TEXBEML(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXBEML static void emit_GLSL_TEXREG2AR(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXREG2AR static void emit_GLSL_TEXREG2GB(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXREG2GB static void emit_GLSL_TEXM3X2PAD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X2PAD static void emit_GLSL_TEXM3X2TEX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X2TEX static void emit_GLSL_TEXM3X3PAD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X3PAD static void emit_GLSL_TEXM3X3TEX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X3TEX static void emit_GLSL_TEXM3X3SPEC(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X3SPEC static void emit_GLSL_TEXM3X3VSPEC(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X3VSPEC static void emit_GLSL_EXPP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_EXPP static void emit_GLSL_LOGP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_LOGP static void emit_GLSL_CND(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_CND static void emit_GLSL_DEF(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DEF static void emit_GLSL_TEXREG2RGB(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXREG2RGB static void emit_GLSL_TEXDP3TEX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXDP3TEX static void emit_GLSL_TEXM3X2DEPTH(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X2DEPTH static void emit_GLSL_TEXDP3(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXDP3 static void emit_GLSL_TEXM3X3(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXM3X3 static void emit_GLSL_TEXDEPTH(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXDEPTH static void emit_GLSL_CMP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_CMP static void emit_GLSL_BEM(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_BEM static void emit_GLSL_DP2ADD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DP2ADD static void emit_GLSL_DSX(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DSX static void emit_GLSL_DSY(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_DSY static void emit_GLSL_TEXLDD(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXLDD static void emit_GLSL_SETP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_SETP static void emit_GLSL_TEXLDL(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_TEXLDL static void emit_GLSL_BREAKP(Context *ctx) { fail(ctx, "unimplemented."); // !!! FIXME } // emit_GLSL_BREAKP static void emit_GLSL_RESERVED(Context *ctx) { // do nothing; fails in the state machine. } // emit_GLSL_RESERVED #endif // SUPPORT_PROFILE_GLSL #if !AT_LEAST_ONE_PROFILE #error No profiles are supported. Fix your build. #endif static const Profile profiles[] = { #if SUPPORT_PROFILE_D3D { "d3d", emit_D3D_start, emit_D3D_end, emit_D3D_comment }, #endif #if SUPPORT_PROFILE_GLSL { "glsl", emit_GLSL_start, emit_GLSL_end, emit_GLSL_comment }, #endif }; // The PROFILE_EMITTER_* items MUST be in the same order as profiles[]! #define PROFILE_EMITTERS(op) { \ PROFILE_EMITTER_D3D(op) \ PROFILE_EMITTER_GLSL(op) \ } static int parse_destination_token(Context *ctx, DestArgInfo *info) { // !!! FIXME: recheck against the spec for ranges (like RASTOUT values, etc). if (ctx->failstr != NULL) return FAIL; // already failed elsewhere. if (ctx->tokencount == 0) return fail(ctx, "Out of tokens in destination parameter"); const uint32 token = SWAP32(*(ctx->tokens)); const int reserved1 = (int) ((token >> 14) & 0x3); // bits 14 through 15 const int reserved2 = (int) ((token >> 31) & 0x1); // bit 31 info->token = ctx->tokens; info->regnum = (int) (token & 0x7ff); // bits 0 through 10 info->relative = (int) ((token >> 13) & 0x1); // bit 13 info->writemask = (int) ((token >> 16) & 0xF); // bits 16 through 19 info->writemask0 = (int) ((token >> 16) & 0x1); // bit 16 info->writemask1 = (int) ((token >> 17) & 0x1); // bit 17 info->writemask2 = (int) ((token >> 18) & 0x1); // bit 18 info->writemask3 = (int) ((token >> 19) & 0x1); // bit 19 info->result_mod = (int) ((token >> 20) & 0xF); // bits 20 through 23 info->result_shift = (int) ((token >> 24) & 0xF); // bits 24 through 27 info->regtype = (int) ((token >> 28) & 0x7) | ((token >> 8) & 0x18); // bits 28-30, 11-12 ctx->tokens++; // swallow token for now, for multiple calls in a row. ctx->tokencount--; // swallow token for now, for multiple calls in a row. if (reserved1 != 0x0) return fail(ctx, "Reserved bit #1 in destination token must be zero"); if (reserved2 != 0x1) return fail(ctx, "Reserved bit #2 in destination token must be one"); if (info->relative) { if (ctx->shader_type != SHADER_TYPE_VERTEX) return fail(ctx, "Relative addressing in non-vertex shader"); else if (ctx->major_ver < 3) return fail(ctx, "Relative addressing in vertex shader version < 3.0"); return fail(ctx, "Relative addressing is unsupported"); // !!! FIXME } // if const int s = info->result_shift; if (s != 0) { if (ctx->shader_type != SHADER_TYPE_PIXEL) return fail(ctx, "Result shift scale in non-pixel shader"); else if (ctx->major_ver >= 2) return fail(ctx, "Result shift scale in pixel shader version >= 2.0"); else if ( ! (((s >= 1) && (s <= 3)) || ((s >= 0xD) && (s <= 0xF))) ) return fail(ctx, "Result shift scale isn't 1 to 3, or 13 to 15."); } // if if (info->result_mod & MOD_SATURATE) // Saturate (vertex shaders only) { if (ctx->shader_type != SHADER_TYPE_VERTEX) return fail(ctx, "Saturate result mod in non-vertex shader"); } // if if (info->result_mod & MOD_PP) // Partial precision (pixel shaders only) { if (ctx->shader_type != SHADER_TYPE_PIXEL) return fail(ctx, "Partial precision result mod in non-pixel shader"); } // if if (info->result_mod & MOD_CENTROID) // Centroid (pixel shaders only) { if (ctx->shader_type != SHADER_TYPE_PIXEL) return fail(ctx, "Centroid result mod in non-pixel shader"); } // if if ((info->regtype < 0) || (info->regtype > REGISTER_TYPE_MAX)) return fail(ctx, "Register type is out of range"); return 1; } // parse_destination_token static int parse_source_token(Context *ctx, SourceArgInfo *info) { if (ctx->failstr != NULL) return FAIL; // already failed elsewhere. if (ctx->tokencount == 0) return fail(ctx, "Out of tokens in source parameter"); const uint32 token = SWAP32(*(ctx->tokens)); const int reserved1 = (int) ((token >> 14) & 0x3); // bits 14 through 15 const int reserved2 = (int) ((token >> 31) & 0x1); // bit 31 info->token = ctx->tokens; info->regnum = (int) (token & 0x7ff); // bits 0 through 10 info->relative = (int) ((token >> 13) & 0x1); // bit 13 info->swizzle = (int) ((token >> 16) & 0xFF); // bits 16 through 23 info->swizzle_x = (int) ((token >> 16) & 0x3); // bits 16 through 17 info->swizzle_y = (int) ((token >> 18) & 0x3); // bits 18 through 19 info->swizzle_z = (int) ((token >> 20) & 0x3); // bits 20 through 21 info->swizzle_w = (int) ((token >> 22) & 0x3); // bits 22 through 23 info->src_mod = (int) ((token >> 24) & 0xF); // bits 24 through 27 info->regtype = (int) ((token >> 28) & 0x7) | ((token >> 9) & 0x18); // bits 28-30, 11-12 ctx->tokens++; // swallow token for now, for multiple calls in a row. ctx->tokencount--; // swallow token for now, for multiple calls in a row. if (reserved1 != 0x0) return fail(ctx, "Reserved bits #1 in source token must be zero"); if (reserved2 != 0x1) return fail(ctx, "Reserved bit #2 in source token must be one"); if (info->relative) { if ((ctx->shader_type == SHADER_TYPE_PIXEL) && (ctx->major_ver < 3)) return fail(ctx, "Relative addressing in pixel shader version < 3.0"); return fail(ctx, "Relative addressing is unsupported"); // !!! FIXME } // if if ( ((SourceMod) info->src_mod) >= SRCMOD_TOTAL ) return fail(ctx, "Unknown source modifier"); return 1; } // parse_source_token static int parse_args_NULL(Context *ctx) { return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_NULL static int parse_args_DEF(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; switch ((RegisterType) ctx->dest_args[0].regtype) { case REGISTER_TYPE_CONST: case REGISTER_TYPE_CONST2: case REGISTER_TYPE_CONST3: case REGISTER_TYPE_CONST4: break; default: return fail(ctx, "DEF token using invalid register"); } // switch // !!! FIXME: msdn says this can be float or int...how do we differentiate? ctx->dwords[0] = SWAP32(ctx->tokens[0]); ctx->dwords[1] = SWAP32(ctx->tokens[1]); ctx->dwords[2] = SWAP32(ctx->tokens[2]); ctx->dwords[3] = SWAP32(ctx->tokens[3]); return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DEF static int parse_args_DEFI(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (((RegisterType) ctx->dest_args[0].regtype) != REGISTER_TYPE_CONSTINT) return fail(ctx, "DEFI token using invalid register"); ctx->dwords[0] = SWAP32(ctx->tokens[0]); ctx->dwords[1] = SWAP32(ctx->tokens[1]); ctx->dwords[2] = SWAP32(ctx->tokens[2]); ctx->dwords[3] = SWAP32(ctx->tokens[3]); return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DEFI static int parse_args_DEFB(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (((RegisterType) ctx->dest_args[0].regtype) != REGISTER_TYPE_CONSTBOOL) return fail(ctx, "DEFB token using invalid register"); ctx->dwords[0] = *(ctx->tokens) ? 1 : 0; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DEFB static int parse_args_DCL(Context *ctx) { int unsupported = 0; const uint32 token = SWAP32(*(ctx->tokens)); const DeclUsageType usage = (DeclUsageType)(token & 0xF); const int reserved1 = (int) ((token >> 31) & 0x1); // bit 31 uint32 reserved_mask = 0x00000000; if (reserved1 != 0x1) return fail(ctx, "Bit #31 in DCL token must be one"); ctx->tokens++; ctx->tokencount--; if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; const RegisterType regtype = (RegisterType) ctx->dest_args[0].regtype; if ((ctx->shader_type == SHADER_TYPE_PIXEL) && (ctx->major_ver >= 3)) { if (regtype == REGISTER_TYPE_INPUT) reserved_mask = 0x7FFFFFFF; else if (regtype == REGISTER_TYPE_MISCTYPE) { const MiscTypeType mt = (MiscTypeType) ctx->dest_args[0].regnum; if (mt == MISCTYPE_TYPE_POSITION) reserved_mask = 0x7FFFFFFF; else if (mt == MISCTYPE_TYPE_FACE) { reserved_mask = 0x7FFFFFFF; if (ctx->dest_args[0].writemask != 0xF) return fail(ctx, "DCL face writemask must be full"); else if (ctx->dest_args[0].result_mod != 0) return fail(ctx, "DCL face result modifier must be zero"); else if (ctx->dest_args[0].result_shift != 0) return fail(ctx, "DCL face shift scale must be zero"); } // else if else { unsupported = 1; } // else } // else if else if (regtype == REGISTER_TYPE_TEXTURE) { const uint32 usage = (token & 0xF); const uint32 index = ((token >> 16) & 0xF); if (usage == DECLUSAGE_TEXCOORD) { if (index > 7) return fail(ctx, "DCL texcoord usage must have 0-7 index"); } // if else if (usage == DECLUSAGE_COLOR) { if (index != 0) return fail(ctx, "DCL color usage must have 0 index"); } // else if else { return fail(ctx, "Invalid DCL texture usage"); } // else reserved_mask = 0x7FF0FFE0; ctx->dwords[0] = usage; ctx->dwords[1] = index; } // else if else if (regtype == REGISTER_TYPE_SAMPLER) { reserved_mask = 0x7FFFFFF; ctx->dwords[0] = ((token >> 27) & 0xF); // TextureType } // else if else { unsupported = 1; } // else } // if else if ((ctx->shader_type == SHADER_TYPE_PIXEL) && (ctx->major_ver >= 2)) { if (regtype == REGISTER_TYPE_INPUT) reserved_mask = 0x7FFFFFFF; else if (regtype == REGISTER_TYPE_TEXTURE) reserved_mask = 0x7FFFFFFF; else if (regtype == REGISTER_TYPE_SAMPLER) { reserved_mask = 0x7FFFFFF; ctx->dwords[0] = ((token >> 27) & 0xF); // TextureType } // else if else { unsupported = 1; } // else } // if else if ((ctx->shader_type == SHADER_TYPE_VERTEX) && (ctx->major_ver >= 3)) { if ((regtype==REGISTER_TYPE_INPUT) || (regtype==REGISTER_TYPE_OUTPUT)) { const uint32 usage = (token & 0xF); const uint32 index = ((token >> 16) & 0xF); reserved_mask = 0x7FF0FFE0; ctx->dwords[0] = usage; ctx->dwords[1] = index; } // if else { unsupported = 1; } // else } // else if else if ((ctx->shader_type == SHADER_TYPE_VERTEX) && (ctx->major_ver >= 2)) { if (regtype == REGISTER_TYPE_INPUT) { const uint32 usage = (token & 0xF); const uint32 index = ((token >> 16) & 0xF); reserved_mask = 0x7FF0FFE0; ctx->dwords[0] = usage; ctx->dwords[1] = index; } // if else { unsupported = 1; } // else } // else if else { unsupported = 1; } // else if (unsupported) return fail(ctx, "invalid DCL register type for this shader model"); if ((token & reserved_mask) != 0) return fail(ctx, "reserved bits in DCL dword aren't zero"); return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DCL static int parse_args_D(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_D static int parse_args_S(Context *ctx) { if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_S static int parse_args_SS(Context *ctx) { if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[1]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_SS static int parse_args_DS(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DS static int parse_args_DSS(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[1]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DSS static int parse_args_DSSS(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[1]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[2]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DSSS static int parse_args_DSSSS(Context *ctx) { if (parse_destination_token(ctx, &ctx->dest_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[0]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[1]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[2]) == FAIL) return FAIL; if (parse_source_token(ctx, &ctx->source_args[3]) == FAIL) return FAIL; return ((ctx->failstr != NULL) ? FAIL : 0); } // parse_args_DSSSS // State machine functions... static int state_RESERVED(Context *ctx) { return fail(ctx, "Tried to use RESERVED opcode."); } // state_RESERVED // Lookup table for instruction opcodes... typedef struct { const char *opcode_string; int arg_tokens; args_function parse_args; state_function state; emit_function emitter[STATICARRAYLEN(profiles)]; } Instruction; // These have to be in the right order! This array is indexed by the value // of the instruction token. static Instruction instructions[] = { // INSTRUCTION_STATE means this opcode has to update the state machine // (we're entering an ELSE block, etc). INSTRUCTION means there's no // state, just go straight to the emitters. #define INSTRUCTION_STATE(op, args, argsseq) { \ #op, args, parse_args_##argsseq, state_##op, PROFILE_EMITTERS(op) \ } #define INSTRUCTION(op, args, argsseq) { \ #op, args, parse_args_##argsseq, NULL, PROFILE_EMITTERS(op) \ } INSTRUCTION(NOP, 0, NULL), INSTRUCTION(MOV, 2, DS), INSTRUCTION(ADD, 3, DSS), INSTRUCTION(SUB, 3, DSS), INSTRUCTION(MAD, 4, DSSS), INSTRUCTION(MUL, 3, DSS), INSTRUCTION(RCP, 2, DS), INSTRUCTION(RSQ, 2, DS), INSTRUCTION(DP3, 3, DSS), INSTRUCTION(DP4, 3, DSS), INSTRUCTION(MIN, 3, DSS), INSTRUCTION(MAX, 3, DSS), INSTRUCTION(SLT, 3, DSS), INSTRUCTION(SGE, 3, DSS), INSTRUCTION(EXP, 2, DS), INSTRUCTION(LOG, 2, DS), INSTRUCTION(LIT, 2, DS), INSTRUCTION(DST, 3, DSS), INSTRUCTION(LRP, 4, DSSS), INSTRUCTION(FRC, 2, DS), INSTRUCTION(M4X4, 3, DSS), INSTRUCTION(M4X3, 3, DSS), INSTRUCTION(M3X4, 3, DSS), INSTRUCTION(M3X3, 3, DSS), INSTRUCTION(M3X2, 3, DSS), INSTRUCTION(CALL, 1, S), INSTRUCTION(CALLNZ, 2, SS), INSTRUCTION(LOOP, 2, SS), INSTRUCTION(RET, 0, NULL), INSTRUCTION(ENDLOOP, 0, NULL), INSTRUCTION(LABEL, 1, S), INSTRUCTION(DCL, 2, DCL), INSTRUCTION(POW, 3, DSS), INSTRUCTION(CRS, 3, DSS), INSTRUCTION(SGN, 4, DSSS), INSTRUCTION(ABS, 2, DS), INSTRUCTION(NRM, 2, DS), INSTRUCTION(SINCOS, 4, NULL), INSTRUCTION(REP, 1, S), INSTRUCTION(ENDREP, 0, NULL), INSTRUCTION(IF, 1, S), INSTRUCTION(IFC, 2, SS), INSTRUCTION(ELSE, 0, NULL), INSTRUCTION(ENDIF, 0, NULL), INSTRUCTION(BREAK, 0, NULL), INSTRUCTION(BREAKC, 2, SS), INSTRUCTION(MOVA, 2, DS), INSTRUCTION(DEFB, 2, DEFB), INSTRUCTION(DEFI, 5, DEFI), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION(TEXCOORD, -1, NULL), INSTRUCTION(TEXKILL, 1, D), INSTRUCTION(TEX, -1, NULL), INSTRUCTION(TEXBEM, 2, DS), INSTRUCTION(TEXBEML, 2, DS), INSTRUCTION(TEXREG2AR, 2, DS), INSTRUCTION(TEXREG2GB, 2, DS), INSTRUCTION(TEXM3X2PAD, 2, DS), INSTRUCTION(TEXM3X2TEX, 2, DS), INSTRUCTION(TEXM3X3PAD, 2, DS), INSTRUCTION(TEXM3X3TEX, 2, DS), INSTRUCTION_STATE(RESERVED, 0, NULL), INSTRUCTION(TEXM3X3SPEC, 3, DSS), INSTRUCTION(TEXM3X3VSPEC, 2, DS), INSTRUCTION(EXPP, 2, DS), INSTRUCTION(LOGP, 2, DS), INSTRUCTION(CND, 4, DSSS), INSTRUCTION(DEF, 5, DEF), INSTRUCTION(TEXREG2RGB, 2, DS), INSTRUCTION(TEXDP3TEX, 2, DS), INSTRUCTION(TEXM3X2DEPTH, 2, DS), INSTRUCTION(TEXDP3, 2, DS), INSTRUCTION(TEXM3X3, 2, DS), INSTRUCTION(TEXDEPTH, 1, D), INSTRUCTION(CMP, 4, DSSS), INSTRUCTION(BEM, 3, DSS), INSTRUCTION(DP2ADD, 4, DSSS), INSTRUCTION(DSX, 2, DS), INSTRUCTION(DSY, 2, DS), INSTRUCTION(TEXLDD, 5, DSSSS), INSTRUCTION(SETP, 3, DSS), INSTRUCTION(TEXLDL, 3, DSS), INSTRUCTION(BREAKP, 1, S), // src #undef INSTRUCTION #undef INSTRUCTION_STATE }; // parse various token types... static int parse_instruction_token(Context *ctx) { const uint32 *start_tokens = ctx->tokens; const uint32 start_tokencount = ctx->tokencount; const uint32 token = SWAP32(*(ctx->tokens)); const uint32 opcode = (token & 0xFFFF); const uint32 controls = ((token >> 16) & 0xFF); const uint32 insttoks = ((token >> 24) & 0x0F); const int coissue = (token & 0x40000000) ? 1 : 0; const int predicated = (token & 0x10000000) ? 1 : 0; const Instruction *instruction = &instructions[opcode]; const emit_function emitter = instruction->emitter[ctx->profileid]; int retval = FAIL; if ( opcode >= (sizeof (instructions) / sizeof (instructions[0])) ) return 0; // not an instruction token, or just not handled here. if ((token & 0x80000000) != 0) return fail(ctx, "instruction token high bit must be zero."); // so says msdn. if (coissue) // !!! FIXME: I'm not sure what this means, yet. return fail(ctx, "coissue instructions unsupported"); if (ctx->major_ver < 2) { if (insttoks != 0) // this is a reserved field in shaders < 2.0 ... return fail(ctx, "instruction token count must be zero"); } // if else if (instruction->arg_tokens >= 0) { if (instruction->arg_tokens != insttoks) { return failf(ctx, "unexpected tokens count (%u) for opcode '%s'.", (uint) insttoks, instruction->opcode_string); } // if else if (ctx->tokencount <= instruction->arg_tokens) { return failf(ctx, "need more tokens (need %u, got %u) for opcode '%s'.", (uint) instruction->arg_tokens, (uint) ctx->tokencount, instruction->opcode_string); } // else if } // else if ctx->instruction_count++; ctx->instruction_controls = controls; // Update the context with instruction's arguments. ctx->tokens++; ctx->tokencount--; if (instruction->parse_args(ctx) == FAIL) return FAIL; // parse_args() moves these forward for convenience...reset them. ctx->tokens = start_tokens; ctx->tokencount = start_tokencount; if (instruction->state != NULL) // update state machine retval = instruction->state(ctx); else { // !!! FIXME //assert(instruction->arg_tokens >= 0); //retval = instruction->arg_tokens + 1; retval = insttoks + 1; } // else if (retval != FAIL) // only do this if there wasn't a previous fail. emitter(ctx); // call the profile's emitter. return retval; } // parse_instruction_token static int parse_version_token(Context *ctx) { if (ctx->tokencount == 0) return fail(ctx, "Expected version token, got none at all."); const uint32 token = SWAP32(*(ctx->tokens)); const uint32 shadertype = ((token >> 16) & 0xFFFF); const uint32 major = (uint32) ((token >> 8) & 0xFF); const uint32 minor = (uint32) (token & 0xFF); // 0xFFFF == pixel shader, 0xFFFE == vertex shader if (shadertype == 0xFFFF) ctx->shader_type = SHADER_TYPE_PIXEL; else if (shadertype == 0xFFFE) ctx->shader_type = SHADER_TYPE_VERTEX; else // geometry shader? Bogus data? return fail(ctx, "Unsupported shader type or not a shader at all"); ctx->major_ver = major; ctx->minor_ver = minor; if (!SHADER_VERSION_SUPPORTED(major, minor)) { return failf(ctx, "Shader Model %u.%u is currently unsupported.", (uint) major, (uint) minor); } // if ctx->profile->start_emitter(ctx); return 1; // ate one token. } // parse_version_token static int parse_comment_token(Context *ctx) { const uint32 token = SWAP32(*(ctx->tokens)); if ((token & 0xFFFF) != 0xFFFE) return 0; // not a comment token. else if ((token & 0x80000000) != 0) return fail(ctx, "comment token high bit must be zero."); // so says msdn. else { const uint32 commenttoks = ((token >> 16) & 0xFFFF); const uint32 len = commenttoks * sizeof (uint32); const int needmalloc = (len >= SCRATCH_BUFFER_SIZE); char *str = ((needmalloc) ? (char *) ctx->malloc(len + 1) : get_scratch_buffer(ctx)); memcpy(str, (const char *) (ctx->tokens+1), len); str[len] = '\0'; ctx->profile->comment_emitter(ctx, str); if (needmalloc) ctx->free(str); return commenttoks + 1; // comment data plus the initial token. } // else // shouldn't hit this. return failf(ctx, "Logic error at %s:%d", __FILE__, __LINE__); } // parse_comment_token static int parse_end_token(Context *ctx) { if (SWAP32(*(ctx->tokens)) != 0x0000FFFF) // end token always 0x0000FFFF. return 0; // not us, eat no tokens. if (ctx->tokencount != 1) // we _must_ be last. If not: fail. return fail(ctx, "end token before end of stream"); ctx->profile->end_emitter(ctx); return END_OF_STREAM; } // parse_end_token static int parse_phase_token(Context *ctx) { if (SWAP32(*(ctx->tokens)) != 0x0000FFFD) // phase token always 0x0000FFFD. return 0; // not us, eat no tokens. return fail(ctx, "not sure what this thing is yet."); } // parse_phase_token static int parse_token(Context *ctx) { int rc = 0; if (ctx->failstr != NULL) return FAIL; // just in case...catch previously unhandled fails here. if (ctx->tokencount == 0) return fail(ctx, "unexpected end of shader."); if ((rc = parse_comment_token(ctx)) != 0) return rc; if ((rc = parse_end_token(ctx)) != 0) return rc; if ((rc = parse_phase_token(ctx)) != 0) return rc; if ((rc = parse_instruction_token(ctx)) != 0) return rc; return failf(ctx, "unknown token (%u)", (uint) *ctx->tokens); } // parse_token static void *internal_malloc(int bytes) { return malloc(bytes); } static void internal_free(void *ptr) { free(ptr); } static int find_profile_id(const char *profile) { int i; for (i = 0; i < STATICARRAYLEN(profiles); i++) { const char *name = profiles[i].name; if (strcmp(name, profile) == 0) return i; } // for return -1; // no match. } // find_profile_id static Context *build_context(const char *profile, const unsigned char *tokenbuf, const unsigned int bufsize, MOJOSHADER_malloc m, MOJOSHADER_free f) { if (m == NULL) m = internal_malloc; if (f == NULL) f = internal_free; Context *ctx = m(sizeof (Context)); if (ctx == NULL) return NULL; memset(ctx, '\0', sizeof (Context)); ctx->malloc = m; ctx->free = f; ctx->tokens = (const uint32 *) tokenbuf; ctx->tokencount = bufsize / sizeof (uint32); ctx->endline = "\n"; ctx->endline_len = 1; // !!! FIXME: do "\r\n" on Windows? ctx->output.str = NULL; ctx->output.next = NULL; ctx->output_tail = &ctx->output; const int profileid = find_profile_id(profile); ctx->profileid = profileid; if (profileid >= 0) // we'll fail later, but we still need the context! ctx->profile = &profiles[profileid]; return ctx; } // build_context static void destroy_context(Context *ctx) { OutputList *item = ctx->output.next; while (item != NULL) { OutputList *next = item->next; ctx->free(item->str); ctx->free(item); item = next; } // for if (ctx->failstr != out_of_mem_string) ctx->free((void *) ctx->failstr); ctx->free(ctx); } // destroy_context static char *build_output(Context *ctx) { char *retval = (char *) ctx->malloc(ctx->output_len + 1); if (retval == NULL) out_of_memory(ctx); else { const char *endline = ctx->endline; const size_t endline_len = ctx->endline_len; char *wptr = retval; OutputList *item = ctx->output.next; while (item != NULL) { const size_t len = strlen(item->str); memcpy(wptr, item->str, len); wptr += len; memcpy(wptr, endline, endline_len); wptr += endline_len; item = item->next; } // while *wptr = '\0'; } // else return retval; } // build_output // API entry point... int MOJOSHADER_parse(const char *profile, const unsigned char *tokenbuf, const unsigned int bufsize, MOJOSHADER_malloc m, MOJOSHADER_free f) { int rc = FAIL; Context *ctx = build_context(profile, tokenbuf, bufsize, m, f); if (ctx == NULL) return 0; // !!! FIXME: error string? if (ctx->profile == NULL) failf(ctx, "Profile '%s' is unknown or unsupported", profile); if (ctx->failstr == NULL) // only go on if there was no previous error... { // Version token always comes first. rc = parse_version_token(ctx); // parse out the rest of the tokens after the version token... while (rc > 0) { ctx->tokens += rc; ctx->tokencount -= rc; rc = parse_token(ctx); } // while } // if // if (ctx->failstr == NULL) { char *str = build_output(ctx); if (str != NULL) { printf("OUTPUT:\n%s\n", str); // !!! FIXME: report to caller. ctx->free(str); } // if printf("INSTRUCTION COUNT: %u\n", (uint) ctx->instruction_count); } // if if (ctx->failstr != NULL) printf("FAIL: %s\n", ctx->failstr); destroy_context(ctx); return (rc == END_OF_STREAM); } // MOJOSHADER_parse int MOJOSHADER_version(void) { return MOJOSHADER_VERSION; } // MOJOSHADER_version // end of mojoshader.c ...