#include "quakedef.h" //#define FORCESTATE void DumpGLState(void); #ifdef GLQUAKE #define r_refract_fboival gl_config.ext_framebuffer_objects #include "glquake.h" #include "shader.h" #ifdef _WIN32 #include #else #include #endif #ifdef FORCESTATE #pragma warningmsg("FORCESTATE is active") #endif #ifdef ANDROID /*android appears to have a bug, and requires f and not i*/ #define qglTexEnvi qglTexEnvf #endif extern cvar_t gl_overbright; extern cvar_t gl_ati_truform; extern cvar_t r_wireframe; static const char LIGHTPASS_SHADER[] = "\ {\n\ program rtlight%s\n\ \ {\n\ map $diffuse\n\ blendfunc add\n\ }\n\ {\n\ map $normalmap\n\ }\n\ {\n\ map $specular\n\ }\n\ {\n\ map $lightcubemap\n\ }\n\ {\n\ map $shadowmap\n\ }\n\ {\n\ map $loweroverlay\n\ }\n\ {\n\ map $upperoverlay\n\ }\n\ }"; enum { LSHADER_STANDARD, LSHADER_CUBE, LSHADER_SMAP, LSHADER_SPOT, LSHADER_MODES }; extern cvar_t r_glsl_offsetmapping, r_noportals; static void BE_SendPassBlendDepthMask(unsigned int sbits); void GLBE_SubmitBatch(batch_t *batch); static qboolean GLBE_RegisterLightShader(int mode); struct { //internal state struct { int lastpasstmus; // int vbo_colour; // int vbo_texcoords[SHADER_PASS_MAX]; // int vbo_deforms; //holds verticies... in case you didn't realise. 
const shader_t *shader_light[1u<polyoffset.factor; po.unit = shaderstate.curshader->polyoffset.unit; if (pushdepth) { /*some quake doors etc are flush with the walls that they're meant to be hidden behind, or plats the same height as the floor, etc we move them back very slightly using polygonoffset to avoid really ugly z-fighting*/ extern cvar_t r_polygonoffset_submodel_offset, r_polygonoffset_submodel_factor; po.factor += r_polygonoffset_submodel_factor.value; po.unit += r_polygonoffset_submodel_offset.value; } if (shaderstate.mode == BEM_DEPTHONLY) { po.factor += 5; po.unit += 25; } #ifndef FORCESTATE if (shaderstate.curpolyoffset.factor != po.factor || shaderstate.curpolyoffset.unit != po.unit) #endif { shaderstate.curpolyoffset = po; if (shaderstate.curpolyoffset.factor || shaderstate.curpolyoffset.unit) { qglEnable(GL_POLYGON_OFFSET_FILL); qglPolygonOffset(shaderstate.curpolyoffset.factor, shaderstate.curpolyoffset.unit); } else qglDisable(GL_POLYGON_OFFSET_FILL); } } void GL_TexEnv(GLenum mode) { #ifndef FORCESTATE if (mode != shaderstate.texenvmode[shaderstate.currenttmu]) #endif { qglTexEnvi(GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, mode); shaderstate.texenvmode[shaderstate.currenttmu] = mode; } } static void BE_SetPassBlendMode(int tmu, int pbm) { #ifndef FORCESTATE if (shaderstate.blendmode[tmu] != pbm) #endif { shaderstate.blendmode[tmu] = pbm; #ifndef FORCESTATE if (shaderstate.currenttmu != tmu) #endif GL_SelectTexture(tmu); switch (pbm) { case PBM_DOTPRODUCT: GL_TexEnv(GL_COMBINE_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE0_RGB_ARB, GL_TEXTURE); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE1_RGB_ARB, GL_PREVIOUS_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_COMBINE_RGB_ARB, GL_DOT3_RGB_ARB); qglTexEnvf(GL_TEXTURE_ENV, GL_RGB_SCALE_ARB, 1); break; case PBM_MODULATE_PREV_COLOUR: GL_TexEnv(GL_COMBINE_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE0_RGB_ARB, GL_PRIMARY_COLOR_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE1_RGB_ARB, GL_PREVIOUS_ARB); qglTexEnvi(GL_TEXTURE_ENV, 
GL_COMBINE_RGB_ARB, GL_MODULATE); qglTexEnvf(GL_TEXTURE_ENV, GL_RGB_SCALE_ARB, 1); break; case PBM_REPLACELIGHT: if (shaderstate.identitylighting != 1) goto forcemod; GL_TexEnv(GL_REPLACE); break; case PBM_REPLACE: GL_TexEnv(GL_REPLACE); break; case PBM_DECAL: if (tmu == 0) goto forcemod; GL_TexEnv(GL_DECAL); break; case PBM_ADD: if (tmu == 0) goto forcemod; GL_TexEnv(GL_ADD); break; case PBM_OVERBRIGHT: GL_TexEnv(GL_COMBINE_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE0_RGB_ARB, GL_TEXTURE); qglTexEnvi(GL_TEXTURE_ENV, GL_SOURCE1_RGB_ARB, GL_PREVIOUS_ARB); qglTexEnvi(GL_TEXTURE_ENV, GL_COMBINE_RGB_ARB, GL_MODULATE); qglTexEnvf(GL_TEXTURE_ENV, GL_RGB_SCALE_ARB, 1<shaderTime; } void GL_SelectTexture(int target) { shaderstate.currenttmu = target; if (qglActiveTextureARB) qglActiveTextureARB(target + mtexid0); else if (qglSelectTextureSGIS) qglSelectTextureSGIS(target + mtexid0); } void GL_SelectVBO(int vbo) { #ifndef FORCESTATE if (shaderstate.currentvbo != vbo) #endif { shaderstate.currentvbo = vbo; qglBindBufferARB(GL_ARRAY_BUFFER_ARB, shaderstate.currentvbo); } } void GL_DeselectVAO(void) { if (shaderstate.currentvao) { qglBindVertexArray(0); shaderstate.currentvao = 0; } } void GL_SelectEBO(int vbo) { //EBO is part of the current VAO, so keep things matching that #ifndef FORCESTATE if (shaderstate.currentebo != vbo) #endif { shaderstate.currentebo = vbo; qglBindBufferARB(GL_ELEMENT_ARRAY_BUFFER_ARB, shaderstate.currentebo); } } void GL_MTBind(int tmu, int target, texid_t texnum) { GL_SelectTexture(tmu); #ifndef FORCESTATE if (shaderstate.currenttextures[tmu] == texnum.num) return; #endif shaderstate.currenttextures[tmu] = texnum.num; if (target) qglBindTexture (target, texnum.num); if ( #ifndef FORCESTATE shaderstate.curtexturetype[tmu] != target && #endif !gl_config.nofixedfunc) { if (shaderstate.curtexturetype[tmu]) qglDisable(shaderstate.curtexturetype[tmu]); shaderstate.curtexturetype[tmu] = target; if (target) qglEnable(target); } } void GL_LazyBind(int tmu, int 
target, texid_t texnum) { #ifndef FORCESTATE if (shaderstate.currenttextures[tmu] != texnum.num) #endif { GL_SelectTexture(tmu); shaderstate.currenttextures[shaderstate.currenttmu] = texnum.num; #ifndef FORCESTATE if (shaderstate.curtexturetype[tmu] != target) #endif { if (shaderstate.curtexturetype[tmu]) qglBindTexture (shaderstate.curtexturetype[tmu], texnum.num); if (gl_config.nofixedfunc) { shaderstate.curtexturetype[tmu] = target; } else { if (shaderstate.curtexturetype[tmu]) qglDisable(shaderstate.curtexturetype[tmu]); shaderstate.curtexturetype[tmu] = target; if (target) qglEnable(target); } } if (target) qglBindTexture (target, texnum.num); } } static void BE_ApplyAttributes(unsigned int bitstochange, unsigned int bitstoendisable) { unsigned int i; //legacy colour attribute (including flat shaded) if ((bitstochange) & (1u<= (1u<= (1u<coord2.gl.vbo && !shaderstate.sourcevbo->coord2.gl.addr) { GL_SelectVBO(shaderstate.pendingvertexvbo); qglVertexAttribPointer(i, 3, GL_FLOAT, GL_FALSE, VECV_STRIDE, shaderstate.pendingvertexpointer); } else { GL_SelectVBO(shaderstate.sourcevbo->coord2.gl.vbo); qglVertexAttribPointer(VATTR_VERTEX2, 3, GL_FLOAT, GL_FALSE, VECV_STRIDE, shaderstate.sourcevbo->coord2.gl.addr); } break; case VATTR_COLOUR: if (shaderstate.sourcevbo->colours.gl.addr) { GL_SelectVBO(shaderstate.sourcevbo->colours.gl.vbo); qglVertexAttribPointer(VATTR_COLOUR, 4, shaderstate.colourarraytype, ((shaderstate.colourarraytype==GL_FLOAT)?GL_FALSE:GL_TRUE), 0, shaderstate.sourcevbo->colours.gl.addr); break; } break; case VATTR_TEXCOORD: GL_SelectVBO(shaderstate.sourcevbo->texcoord.gl.vbo); qglVertexAttribPointer(VATTR_TEXCOORD, 2, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->texcoord.gl.addr); break; case VATTR_LMCOORD: if (!shaderstate.sourcevbo->lmcoord[0].gl.vbo && !shaderstate.sourcevbo->lmcoord[0].gl.addr) { GL_SelectVBO(shaderstate.sourcevbo->texcoord.gl.vbo); qglVertexAttribPointer(VATTR_LMCOORD, 2, GL_FLOAT, GL_FALSE, 0, 
shaderstate.sourcevbo->texcoord.gl.addr); } else { GL_SelectVBO(shaderstate.sourcevbo->lmcoord[0].gl.vbo); qglVertexAttribPointer(VATTR_LMCOORD, 2, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->lmcoord[0].gl.addr); } break; case VATTR_LMCOORD2: GL_SelectVBO(shaderstate.sourcevbo->lmcoord[1].gl.vbo); qglVertexAttribPointer(VATTR_LMCOORD2, 2, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->lmcoord[1].gl.addr); break; case VATTR_LMCOORD3: GL_SelectVBO(shaderstate.sourcevbo->lmcoord[2].gl.vbo); qglVertexAttribPointer(VATTR_LMCOORD3, 2, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->lmcoord[2].gl.addr); break; case VATTR_LMCOORD4: GL_SelectVBO(shaderstate.sourcevbo->lmcoord[3].gl.vbo); qglVertexAttribPointer(VATTR_LMCOORD4, 2, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->lmcoord[3].gl.addr); break; case VATTR_NORMALS: if (!shaderstate.sourcevbo->normals.gl.addr) { shaderstate.sha_attr &= ~(1u<normals.gl.vbo); qglVertexAttribPointer(VATTR_NORMALS, 3, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->normals.gl.addr); break; case VATTR_SNORMALS: if (!shaderstate.sourcevbo->svector.gl.addr) { shaderstate.sha_attr &= ~(1u<svector.gl.vbo); qglVertexAttribPointer(VATTR_SNORMALS, 3, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->svector.gl.addr); break; case VATTR_TNORMALS: if (!shaderstate.sourcevbo->tvector.gl.addr) { shaderstate.sha_attr &= ~(1u<tvector.gl.vbo); qglVertexAttribPointer(VATTR_TNORMALS, 3, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->tvector.gl.addr); break; case VATTR_BONENUMS: GL_SelectVBO(shaderstate.sourcevbo->bonenums.gl.vbo); qglVertexAttribPointer(VATTR_BONENUMS, 4, GL_UNSIGNED_BYTE, GL_FALSE, 0, shaderstate.sourcevbo->bonenums.gl.addr); break; case VATTR_BONEWEIGHTS: GL_SelectVBO(shaderstate.sourcevbo->boneweights.gl.vbo); qglVertexAttribPointer(VATTR_BONEWEIGHTS, 4, GL_FLOAT, GL_FALSE, 0, shaderstate.sourcevbo->boneweights.gl.addr); break; } if ((bitstoendisable) & (1u<vaodynamic&progattrmask; #if 0 bitstoendisable = 0; #else bitstoendisable = 
shaderstate.sourcevbo->vaoenabled^progattrmask; if (bitstoendisable) bitstochange |= bitstoendisable; shaderstate.sourcevbo->vaoenabled = progattrmask; #endif if (bitstochange & (1u<indicies.gl.vbo); } } else { bitstochange = progattrmask; bitstoendisable = progattrmask^shaderstate.sha_attr; shaderstate.sha_attr = progattrmask; #ifndef FORCESTATE if (shaderstate.currentebo != shaderstate.sourcevbo->indicies.gl.vbo) #endif { shaderstate.currentebo = shaderstate.sourcevbo->indicies.gl.vbo; qglBindBufferARB(GL_ELEMENT_ARRAY_BUFFER_ARB, shaderstate.currentebo); } } if (bitstochange || bitstoendisable) BE_ApplyAttributes(bitstochange, bitstoendisable); } void GLBE_SetupVAO(vbo_t *vbo, unsigned int vaodynamic, unsigned int vaostatic) { if (qglGenVertexArrays) { qglGenVertexArrays(1, &vbo->vao); if ((vaostatic & VATTR_VERTEX1) && !gl_config.nofixedfunc) vaostatic = (vaostatic & ~VATTR_VERTEX1) | VATTR_LEG_VERTEX; if ((vaodynamic & VATTR_VERTEX1) && !gl_config.nofixedfunc) vaodynamic = (vaodynamic & ~VATTR_VERTEX1) | VATTR_LEG_VERTEX; shaderstate.curvertexpointer = NULL; shaderstate.curvertexvbo = 0; shaderstate.sourcevbo = vbo; shaderstate.pendingvertexvbo = shaderstate.sourcevbo->coord.gl.vbo; shaderstate.pendingvertexpointer = shaderstate.sourcevbo->coord.gl.addr; shaderstate.colourarraytype = GL_FLOAT; shaderstate.currentvao = vbo->vao; qglBindVertexArray(vbo->vao); qglBindBufferARB(GL_ELEMENT_ARRAY_BUFFER_ARB, shaderstate.sourcevbo->indicies.gl.vbo); BE_ApplyAttributes(vaostatic, vaodynamic|vaostatic); GL_SelectVBO(shaderstate.sourcevbo->coord.gl.vbo); vbo->vaoenabled = vaodynamic|vaostatic; vbo->vaodynamic = vaodynamic; shaderstate.curvertexpointer = NULL; shaderstate.curvertexvbo = 0; } else { GL_DeselectVAO(); /*always select the coord vbo and indicies ebo, for easy bufferdata*/ GL_SelectEBO(vbo->indicies.gl.vbo); GL_SelectVBO(vbo->coord.gl.vbo); } } void GL_SelectProgram(int program) { if (shaderstate.currentprogram != program) { qglUseProgramObjectARB(program); 
shaderstate.currentprogram = program; } } static void GL_DeSelectProgram(void) { if (shaderstate.currentprogram != 0) { qglUseProgramObjectARB(0); shaderstate.currentprogram = 0; } } void GLBE_RenderShadowBuffer(unsigned int numverts, int vbo, vecV_t *verts, unsigned numindicies, int ibo, index_t *indicies) { shaderstate.pendingvertexvbo = vbo; shaderstate.pendingvertexpointer = verts; shaderstate.sourcevbo = &shaderstate.dummyvbo; shaderstate.dummyvbo.indicies.gl.vbo = ibo; if (shaderstate.allblackshader) { GL_SelectProgram(shaderstate.allblackshader); BE_EnableShaderAttributes(gl_config.nofixedfunc?(1u<topcolour; if (cv >= 16) { *retred = (((cv&0xff0000)>>16)**((unsigned char*)&d_8to24rgbtable[15]+0))>>8; *retgreen = (((cv&0x00ff00)>>8)**((unsigned char*)&d_8to24rgbtable[15]+1))>>8; *retblue = (((cv&0x0000ff)>>0)**((unsigned char*)&d_8to24rgbtable[15]+2))>>8; return; } if (cv >= 0) i = cv; else i = TOP_RANGE>>4; if (i > 8) { i<<=4; } else { i<<=4; i+=15; } i*=3; *retred = host_basepal[i+0]; *retgreen = host_basepal[i+1]; *retblue = host_basepal[i+2]; /* if (!gammaworks) { *retred = gammatable[*retred]; *retgreen = gammatable[*retgreen]; *retblue = gammatable[*retblue]; }*/ } void R_FetchBottomColour(int *retred, int *retgreen, int *retblue) { int i; unsigned int cv = shaderstate.curentity->bottomcolour; if (cv >= 16) { *retred = (((cv&0xff0000)>>16)**((unsigned char*)&d_8to24rgbtable[15]+0))>>8; *retgreen = (((cv&0x00ff00)>>8)**((unsigned char*)&d_8to24rgbtable[15]+1))>>8; *retblue = (((cv&0x0000ff)>>0)**((unsigned char*)&d_8to24rgbtable[15]+2))>>8; return; } if (cv >= 0) i = cv; else i = BOTTOM_RANGE>>4; if (i > 8) { i<<=4; } else { i<<=4; i+=15; } i*=3; *retred = host_basepal[i+0]; *retgreen = host_basepal[i+1]; *retblue = host_basepal[i+2]; /* if (!gammaworks) { *retred = gammatable[*retred]; *retgreen = gammatable[*retgreen]; *retblue = gammatable[*retblue]; }*/ } static void RevertToKnownState(void) { if (shaderstate.currentvao) qglBindVertexArray(0); 
shaderstate.currentvao = 0; shaderstate.curvertexvbo = ~0; GL_SelectVBO(0); // GL_SelectEBO(0); while(shaderstate.lastpasstmus>0) { GL_LazyBind(--shaderstate.lastpasstmus, 0, r_nulltex); } GL_SelectTexture(0); if (!gl_config.nofixedfunc) { BE_SetPassBlendMode(0, PBM_REPLACE); qglColor3f(1,1,1); GL_DeSelectProgram(); } shaderstate.shaderbits &= ~(SBITS_MISC_DEPTHEQUALONLY|SBITS_MISC_DEPTHCLOSERONLY|SBITS_MASK_BITS); shaderstate.shaderbits |= SBITS_MISC_DEPTHWRITE; shaderstate.shaderbits &= ~(SBITS_BLEND_BITS); qglDisable(GL_BLEND); qglDepthFunc(GL_LEQUAL); qglDepthMask(GL_TRUE); qglColorMask(GL_TRUE, GL_TRUE, GL_TRUE, GL_TRUE); } void PPL_RevertToKnownState(void) { RevertToKnownState(); } void R_IBrokeTheArrays(void) { RevertToKnownState(); } #ifdef RTLIGHTS //called from gl_shadow void GLBE_SetupForShadowMap(texid_t shadowmaptex, int texwidth, int texheight, float shadowscale) { shaderstate.lightshadowmapinfo[0] = 1.0/texwidth; shaderstate.lightshadowmapinfo[1] = 1.0/texwidth; shaderstate.lightshadowmapinfo[2] = 1.0; shaderstate.lightshadowmapinfo[3] = shadowscale; shaderstate.curshadowmap = shadowmaptex; while(shaderstate.lastpasstmus>0) { GL_LazyBind(--shaderstate.lastpasstmus, 0, r_nulltex); } shaderstate.shaderbits &= ~SBITS_MISC_DEPTHWRITE; if (qglShadeModel) qglShadeModel(GL_FLAT); BE_SetPassBlendMode(0, PBM_REPLACE); GL_ForceDepthWritable(); // qglColorMask(GL_FALSE, GL_FALSE, GL_FALSE, GL_FALSE); BE_SelectMode(BEM_DEPTHONLY); } #endif static void T_Gen_CurrentRender(int tmu) { int vwidth, vheight; if (r_refdef.recurse) return; if (r_config.texture_non_power_of_two) { vwidth = vid.pixelwidth; vheight = vid.pixelheight; } else { vwidth = 1; vheight = 1; while (vwidth < vid.pixelwidth) { vwidth *= 2; } while (vheight < vid.pixelheight) { vheight *= 2; } } // copy the scene to texture if (!TEXVALID(shaderstate.temptexture)) TEXASSIGN(shaderstate.temptexture, GL_AllocNewTexture("***$currentrender***", vwidth, vheight, 0)); GL_MTBind(tmu, GL_TEXTURE_2D, 
shaderstate.temptexture); qglCopyTexImage2D(GL_TEXTURE_2D, 0, GL_RGB, 0, 0, vwidth, vheight, 0); qglTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR); qglTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_LINEAR); qglTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE); qglTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE); } static void Shader_BindTextureForPass(int tmu, const shaderpass_t *pass) { extern texid_t missing_texture; extern texid_t missing_texture_gloss; extern texid_t scenepp_postproc_cube; extern texid_t r_whiteimage; texid_t t; switch(pass->texgen) { default: case T_GEN_SINGLEMAP: t = pass->anim_frames[0]; break; case T_GEN_ANIMMAP: t = pass->anim_frames[(int)(pass->anim_fps * shaderstate.curtime) % pass->anim_numframes]; break; case T_GEN_LIGHTMAP: if (shaderstate.curbatch->lightmap[0] < 0) t = r_whiteimage; else t = lightmap[shaderstate.curbatch->lightmap[0]]->lightmap_texture; break; case T_GEN_DELUXMAP: { int lmi = shaderstate.curbatch->lightmap[0]; if (lmi < 0 || !lightmap[lmi]->hasdeluxe) t = r_nulltex; //fixme else t = lightmap[lmi+1]->lightmap_texture; } break; case T_GEN_DIFFUSE: if (shaderstate.curtexnums && TEXVALID(shaderstate.curtexnums->base)) t = shaderstate.curtexnums->base; else t = missing_texture; break; case T_GEN_NORMALMAP: t = shaderstate.curtexnums?shaderstate.curtexnums->bump:r_nulltex; /*FIXME: nulltex is not correct*/ break; case T_GEN_SPECULAR: if (TEXVALID(shaderstate.curtexnums->specular)) t = shaderstate.curtexnums->specular; else t = missing_texture_gloss; break; case T_GEN_UPPEROVERLAY: t = shaderstate.curtexnums->upperoverlay; break; case T_GEN_LOWEROVERLAY: t = shaderstate.curtexnums->loweroverlay; break; case T_GEN_FULLBRIGHT: t = shaderstate.curtexnums->fullbright; break; case T_GEN_SHADOWMAP: t = shaderstate.curshadowmap; break; case T_GEN_LIGHTCUBEMAP: GL_LazyBind(tmu, GL_TEXTURE_CUBE_MAP_ARB, shaderstate.lightcubemap); return; case T_GEN_CUBEMAP: t = 
pass->anim_frames[0];
		GL_LazyBind(tmu, GL_TEXTURE_CUBE_MAP_ARB, t);
		return;
	case T_GEN_SOURCECUBE:
		t = scenepp_postproc_cube;
		GL_LazyBind(tmu, GL_TEXTURE_CUBE_MAP_ARB, t);
		return;

	case T_GEN_3DMAP:
		t = pass->anim_frames[0];
		GL_LazyBind(tmu, GL_TEXTURE_3D, t);
		return;

	case T_GEN_VIDEOMAP:
		/*without media support the pass shows the base texture instead*/
#ifdef NOMEDIA
		t = shaderstate.curtexnums?shaderstate.curtexnums->base:r_nulltex;
#else
		t = Media_UpdateForShader(pass->cin);
#endif
		break;

	case T_GEN_CURRENTRENDER:
		T_Gen_CurrentRender(tmu);
		return;

	case T_GEN_SOURCECOLOUR:
		t = shaderstate.tex_sourcecol;
		break;
	case T_GEN_SOURCEDEPTH:
		t = shaderstate.tex_sourcedepth;
		break;

	case T_GEN_REFLECTION:
		t = shaderstate.tex_reflection;
		break;
	case T_GEN_REFRACTION:
		/*when r_refract_fboival is zero, a copy of the current render is used in place of the refraction texture*/
		if (!r_refract_fboival)
		{
			T_Gen_CurrentRender(tmu);
			return;
		}
		t = shaderstate.tex_refraction;
		break;
	case T_GEN_REFRACTIONDEPTH:
		t = shaderstate.tex_refractiondepth;
		break;
	case T_GEN_RIPPLEMAP:
		t = shaderstate.tex_ripplemap;
		break;
	}
	/*every case that reaches here binds as a plain 2D texture*/
	GL_LazyBind(tmu, GL_TEXTURE_2D, t);
}

/*========================================== matrix functions =====================================*/

typedef vec3_t mat3_t[3];
static mat3_t axisDefault={{1, 0, 0},
					{0, 1, 0},
					{0, 0, 1}};

/*writes the transpose of 'in' to 'out'. elements are copied one by one, so 'out' must not be the same matrix as 'in'*/
static void Matrix3_Transpose (mat3_t in, mat3_t out)
{
	out[0][0] = in[0][0];
	out[1][1] = in[1][1];
	out[2][2] = in[2][2];

	out[0][1] = in[1][0];
	out[0][2] = in[2][0];
	out[1][0] = in[0][1];
	out[1][2] = in[2][1];
	out[2][0] = in[0][2];
	out[2][1] = in[1][2];
}
/*product = a * b, treating b as a column vector. 'product' must not alias 'b' because b is re-read for every row*/
static void Matrix3_Multiply_Vec3 (mat3_t a, vec3_t b, vec3_t product)
{
	product[0] = a[0][0]*b[0] + a[0][1]*b[1] + a[0][2]*b[2];
	product[1] = a[1][0]*b[0] + a[1][1]*b[1] + a[1][2]*b[2];
	product[2] = a[2][0]*b[0] + a[2][1]*b[1] + a[2][2]*b[2];
}

/*bytewise comparison: returns 0 when both matrices hold identical bytes, otherwise the memcmp result*/
static int Matrix3_Compare(mat3_t in, mat3_t out)
{
	return memcmp(in, out, sizeof(mat3_t));
}

//end matrix functions
/*========================================== tables for deforms =====================================*/
#define frand() (rand()*(1.0/RAND_MAX))
#define FTABLE_SIZE		1024
/*maps x (in cycles) to a table index; the mask relies on FTABLE_SIZE being a power of two*/
#define FTABLE_CLAMP(x)	(((int)((x)*FTABLE_SIZE) & (FTABLE_SIZE-1)))
/*looks x up in 'table'; with a NULL table the result is a random value scaled by the fractional part of x*/
#define FTABLE_EVALUATE(table,x) (table ? table[FTABLE_CLAMP(x)] : frand()*((x)-floor(x)))

/*one cycle of each waveform, filled in by GLBE_Init*/
static	float	r_sintable[FTABLE_SIZE];
static	float	r_triangletable[FTABLE_SIZE];
static	float	r_squaretable[FTABLE_SIZE];
static	float	r_sawtoothtable[FTABLE_SIZE];
static	float	r_inversesawtoothtable[FTABLE_SIZE];

/*returns the lookup table for a SHADER_FUNC_* value, or NULL for any other value*/
static float *FTableForFunc ( unsigned int func )
{
	switch (func)
	{
		case SHADER_FUNC_SIN:
			return r_sintable;

		case SHADER_FUNC_TRIANGLE:
			return r_triangletable;

		case SHADER_FUNC_SQUARE:
			return r_squaretable;

		case SHADER_FUNC_SAWTOOTH:
			return r_sawtoothtable;

		case SHADER_FUNC_INVERSESAWTOOTH:
			return r_inversesawtoothtable;
	}

	//bad values allow us to crash (so I can debug em)
	return NULL;
}

/*builds the light-pass shader script from LIGHTPASS_SHADER (with an empty string substituted for its %s) and hands it to Shader_DefaultScript. 'args' is not used*/
void Shader_LightPass(char *shortname, shader_t *s, const void *args)
{
	char shadertext[8192*2];
	sprintf(shadertext, LIGHTPASS_SHADER, "");
	Shader_DefaultScript(shortname, s, shadertext);
}

/*
Fills *tex with a FOGS x FOGT RGBA lookup texture: colour is always white, alpha is the fog amount 1-exp(-density*z),
where z runs from 0 to zscale along the S axis. Every row (T) holds the same values.
Regeneration is skipped when *tex is already valid and density/zscale match the values of the previous call.
NOTE(review): the remembered density/zscale are function-level statics shared by all callers, not stored per texture.
*/
void GenerateFogTexture(texid_t *tex, float density, float zscale)
{
#define FOGS 256
#define FOGT 32
	byte_vec4_t fogdata[FOGS*FOGT];
	int s, t;
	float f, z;
	static float fogdensity, fogzscale;
	if (TEXVALID(*tex) && density == fogdensity && zscale == fogzscale)
		return;
	fogdensity = density;
	fogzscale = zscale;

	for(s = 0; s < FOGS; s++)
		for(t = 0; t < FOGT; t++)
		{
			z = (float)s / (FOGS-1);
			z *= zscale;

			/*only the GL_EXP branch is live; the other two are kept for reference*/
			if (0)//q3
				f = pow(z, 0.5);
			else if (1)//GL_EXP
				f = 1-exp(-density * z);
			else //GL_EXP2
				f = 1-exp(-(density*density) * z);

			if (f < 0)
				f = 0;
			if (f > 1)
				f = 1;

			fogdata[t*FOGS + s][0] = 255;
			fogdata[t*FOGS + s][1] = 255;
			fogdata[t*FOGS + s][2] = 255;
			fogdata[t*FOGS + s][3] = 255*f;
		}

	if (!TEXVALID(*tex))
		*tex = R_AllocNewTexture("***fog***", FOGS, FOGT, 0);
	R_Upload(*tex, "fog", TF_RGBA32, fogdata, NULL, FOGS, FOGT, IF_CLAMP|IF_NOMIPMAP);
}

/*frees the wbatches array and resets its bookkeeping*/
void GLBE_Shutdown(void)
{
	BZ_Free(shaderstate.wbatches);
	shaderstate.wbatches = NULL;
	shaderstate.maxwbatches = 0;
}

/*resets the backend state, fills the waveform tables and sets up defaults for the world entity*/
void GLBE_Init(void)
{
	int i;
	double t;

	/*release what shaderstate still owns before it is wiped*/
	GLBE_Shutdown();

	memset(&shaderstate, 0, sizeof(shaderstate));

	shaderstate.curentity =
&r_worldentity;
	be_maxpasses = gl_mtexarbable;
	gl_stencilbits = 0;
	if (gl_config.glversion >= 3.0 && gl_config.nofixedfunc)
	{
		//docs say this line should be okay in gl3+. nvidia do not seem to agree. GL_STENCIL_BITS is deprecated however. so for now, just assume.
		//qglGetFramebufferAttachmentParameteriv(GL_FRAMEBUFFER_EXT, GL_STENCIL, GL_FRAMEBUFFER_ATTACHMENT_STENCIL_SIZE, &gl_stencilbits);
		gl_stencilbits = 8;
	}
	else
		qglGetIntegerv(GL_STENCIL_BITS, &gl_stencilbits);

	/*fill one full cycle of each waveform; t runs over [0,1)*/
	for (i = 0; i < FTABLE_SIZE; i++)
	{
		t = (double)i / (double)FTABLE_SIZE;

		r_sintable[i] = sin(t * 2*M_PI);

		/*triangle: 0 up to 1 over the first quarter, down to -1 by three quarters, then back up towards 0*/
		if (t < 0.25)
			r_triangletable[i] = t * 4.0;
		else if (t < 0.75)
			r_triangletable[i] = 2 - 4.0 * t;
		else
			r_triangletable[i] = (t - 0.75) * 4.0 - 1.0;

		/*square: +1 for the first half of the cycle, -1 for the second*/
		if (t < 0.5)
			r_squaretable[i] = 1.0f;
		else
			r_squaretable[i] = -1.0f;

		r_sawtoothtable[i] = t;
		r_inversesawtoothtable[i] = 1.0 - t;
	}

	shaderstate.identitylighting = 1;
	/*-1 marks "no lightmap" (the lightmap texgen checks for a negative index)*/
	for (i = 0; i < MAXLIGHTMAPS; i++)
		shaderstate.dummybatch.lightmap[i] = -1;

#ifdef RTLIGHTS
	/*register the light shader up front when realtime lighting is enabled*/
	if (r_shadow_realtime_dlight.ival || r_shadow_realtime_world.ival)
	{
		if (r_shadow_shadowmapping.ival)
			GLBE_RegisterLightShader(LSHADER_SMAP);
		else
			GLBE_RegisterLightShader(0);
	}
#endif

	gl_overbright.modified = true; /*in case the d3d renderer does the same*/
	/*lock the cvar down if the backend can't actually do it*/
	if (!gl_config.tex_env_combine && !gl_config.nofixedfunc && gl_overbright.ival)
		Cvar_ApplyLatchFlag(&gl_overbright, "0", CVAR_RENDERERLATCH);
	shaderstate.shaderbits = ~SBITS_ATEST_BITS;
	BE_SendPassBlendDepthMask(0);
	currententity = &r_worldentity;

	shaderstate.fogtexture = r_nulltex;

	//make sure the world draws correctly
	r_worldentity.shaderRGBAf[0] = 1;
	r_worldentity.shaderRGBAf[1] = 1;
	r_worldentity.shaderRGBAf[2] = 1;
	r_worldentity.shaderRGBAf[3] = 1;
	r_worldentity.axis[0][0] = 1;
	r_worldentity.axis[1][1] = 1;
	r_worldentity.axis[2][2] = 1;
	r_worldentity.light_avg[0] = 1;
	r_worldentity.light_avg[1] = 1;
	r_worldentity.light_avg[2] = 1;

	R_InitFlashblends();

	//only do this where we have to.
	if (qglBufferDataARB && gl_config.nofixedfunc)
	{
		/*create the buffer (and, where available, vertex array) objects for the stream* arrays*/
		memset(&shaderstate.streamvbo, 0, sizeof(shaderstate.streamvbo));
		memset(&shaderstate.streamebo, 0, sizeof(shaderstate.streamebo));
		memset(&shaderstate.streamvao, 0, sizeof(shaderstate.streamvao));
		qglGenBuffersARB(sizeof(shaderstate.streamvbo)/sizeof(shaderstate.streamvbo[0]), shaderstate.streamvbo);
		qglGenBuffersARB(sizeof(shaderstate.streamebo)/sizeof(shaderstate.streamebo[0]), shaderstate.streamebo);
		if (qglGenVertexArrays)
			qglGenVertexArrays(sizeof(shaderstate.streamvao)/sizeof(shaderstate.streamvao[0]), shaderstate.streamvao);
	}
}

//end tables

/*cpu-side scratch arrays that the generator functions write into*/
#define MAX_ARRAY_VERTS 65535
static avec4_t		coloursarray[MAX_ARRAY_VERTS];
static float		texcoordarray[SHADER_PASS_MAX][MAX_ARRAY_VERTS*2];
static vecV_t		vertexarray[MAX_ARRAY_VERTS];

/*========================================== texture coord generation =====================================*/

/*
Writes environment-map texture coordinates for numverts vertices.
st:	output, two floats per vertex.
xyz:	vertex positions, stepped by sizeof(vecV_t) per vertex.
normal:	vertex normals, three floats per vertex.
The eye position is first rotated into the current entity's space; each st is derived from the view vector reflected about the normal.
*/
static void tcgen_environment(float *st, unsigned int numverts, float *xyz, float *normal)
{
	int			i;
	vec3_t		viewer, reflected;
	float		d;

	vec3_t		rorg;

	RotateLightVector(shaderstate.curentity->axis, shaderstate.curentity->origin, r_origin, rorg);

	for (i = 0 ; i < numverts ; i++, xyz += sizeof(vecV_t)/sizeof(vec_t), normal += 3, st += 2 )
	{
		VectorSubtract (rorg, xyz, viewer);
		VectorNormalizeFast (viewer);

		d = DotProduct (normal, viewer);

		/*reflect the view vector about the normal*/
		reflected[0] = normal[0]*2*d - viewer[0];
		reflected[1] = normal[1]*2*d - viewer[1];
		reflected[2] = normal[2]*2*d - viewer[2];

		st[0] = 0.5 + reflected[1] * 0.5;
		st[1] = 0.5 - reflected[2] * 0.5;
	}
}

/*
Writes fog texture coordinates for numverts vertices: st[0] is the vertex depth taken from the modelview matrix and scaled by shaderstate.fogfar,
st[1] is the fractional part of realtime. The 'fog' argument is not read.
*/
static void tcgen_fog(float *st, unsigned int numverts, float *xyz, mfog_t *fog)
{
	int			i;

	float z;
	vec4_t zmat;

	//generate a simple matrix to calc only the projected z coord
	zmat[0] = -shaderstate.modelviewmatrix[2];
	zmat[1] = -shaderstate.modelviewmatrix[6];
	zmat[2] = -shaderstate.modelviewmatrix[10];
	zmat[3] = -shaderstate.modelviewmatrix[14];

	Vector4Scale(zmat, shaderstate.fogfar, zmat);

	for (i = 0 ; i < numverts ; i++, xyz += sizeof(vecV_t)/sizeof(vec_t),
st += 2 ) { z = DotProduct(xyz, zmat) + zmat[3]; st[0] = z; st[1] = realtime - (int)realtime; } } static float *tcgen(unsigned int tcgen, int cnt, float *dst, const mesh_t *mesh) { int i; vecV_t *src; switch (tcgen) { default: case TC_GEN_BASE: return (float*)mesh->st_array; case TC_GEN_LIGHTMAP: if (!mesh->lmst_array) return (float*)mesh->st_array; else return (float*)mesh->lmst_array; case TC_GEN_NORMAL: return (float*)mesh->normals_array; case TC_GEN_SVECTOR: return (float*)mesh->snormals_array; case TC_GEN_TVECTOR: return (float*)mesh->tnormals_array; case TC_GEN_ENVIRONMENT: if (!mesh->normals_array) return (float*)mesh->st_array; tcgen_environment(dst, cnt, (float*)mesh->xyz_array, (float*)mesh->normals_array); return dst; // case TC_GEN_DOTPRODUCT: // return mesh->st_array[0]; case TC_GEN_VECTOR: src = mesh->xyz_array; for (i = 0; i < cnt; i++, dst += 2) { static vec3_t tc_gen_s = { 1.0f, 0.0f, 0.0f }; static vec3_t tc_gen_t = { 0.0f, 1.0f, 0.0f }; dst[0] = DotProduct(tc_gen_s, src[i]); dst[1] = DotProduct(tc_gen_t, src[i]); } return dst; } } /*src and dst can be the same address when tcmods are chained*/ static void tcmod(const tcmod_t *tcmod, int cnt, const float *src, float *dst, const mesh_t *mesh) { float *table; float t1, t2; float cost, sint; int j; #define R_FastSin(x) sin((x)*(2*M_PI)) switch (tcmod->type) { case SHADER_TCMOD_ROTATE: cost = tcmod->args[0] * shaderstate.curtime; sint = R_FastSin(cost); cost = R_FastSin(cost + 0.25); for (j = 0; j < cnt; j++, dst+=2,src+=2) { t1 = cost * (src[0] - 0.5f) - sint * (src[1] - 0.5f) + 0.5f; t2 = cost * (src[1] - 0.5f) + sint * (src[0] - 0.5f) + 0.5f; dst[0] = t1; dst[1] = t2; } break; case SHADER_TCMOD_SCALE: t1 = tcmod->args[0]; t2 = tcmod->args[1]; for (j = 0; j < cnt; j++, dst+=2,src+=2) { dst[0] = src[0] * t1; dst[1] = src[1] * t2; } break; case SHADER_TCMOD_TURB: t1 = tcmod->args[2] + shaderstate.curtime * tcmod->args[3]; t2 = tcmod->args[1]; for (j = 0; j < cnt; j++, dst+=2,src+=2) { dst[0] = src[0] 
+ R_FastSin (src[0]*t2+t1) * t2;
				dst[1] = src[1] + R_FastSin (src[1]*t2+t1) * t2;
			}
			break;

		case SHADER_TCMOD_STRETCH:
			table = FTableForFunc(tcmod->args[0]);
			t2 = tcmod->args[3] + shaderstate.curtime * tcmod->args[4];
			t1 = FTABLE_EVALUATE(table, t2) * tcmod->args[2] + tcmod->args[1];
			/*the coords are scaled by the reciprocal of the wave value; a zero value leaves them unscaled*/
			t1 = t1 ? 1.0f / t1 : 1.0f;
			/*offset that keeps the scaling centred on 0.5,0.5*/
			t2 = 0.5f - 0.5f * t1;
			for (j = 0; j < cnt; j++, dst+=2,src+=2)
			{
				dst[0] = src[0] * t1 + t2;
				dst[1] = src[1] * t1 + t2;
			}
			break;

		case SHADER_TCMOD_SCROLL:
			/*args hold the scroll speed per axis; the offset grows with curtime*/
			t1 = tcmod->args[0] * shaderstate.curtime;
			t2 = tcmod->args[1] * shaderstate.curtime;

			for (j = 0; j < cnt; j++, dst += 2, src+=2)
			{
				dst[0] = src[0] + t1;
				dst[1] = src[1] + t2;
			}
			break;

		case SHADER_TCMOD_TRANSFORM:
			for (j = 0; j < cnt; j++, dst+=2, src+=2)
			{
				/*copy the inputs first: src and dst may be the same memory*/
				t1 = src[0];
				t2 = src[1];
				dst[0] = t1 * tcmod->args[0] + t2 * tcmod->args[2] + tcmod->args[4];
				dst[1] = t2 * tcmod->args[1] + t1 * tcmod->args[3] + tcmod->args[5];
			}
			break;

		default:
			/*unknown types leave dst untouched*/
			break;
	}
}

/*generates fog texture coordinates for every mesh of the current batch into texcoordarray[passnum] and makes that array the pending texcoord source for the pass*/
static void GenerateTCFog(int passnum, mfog_t *fog)
{
	int m;
	mesh_t *mesh;
	for (m = 0; m < shaderstate.meshcount; m++)
	{
		mesh = shaderstate.meshes[m];
		/*each mesh writes at its own vertex offset (two floats per vertex)*/
		tcgen_fog(texcoordarray[passnum]+mesh->vbofirstvert*2, mesh->numvertexes, (float*)mesh->xyz_array, fog);
	}

	/*two components per coord, no vbo, client-side pointer*/
	shaderstate.pendingtexcoordparts[passnum] = 2;
	shaderstate.pendingtexcoordvbo[passnum] = 0;
	shaderstate.pendingtexcoordpointer[passnum] = texcoordarray[passnum];
}
/*runs the pass's tcgen and then its chain of tcmods over every mesh of the current batch, leaving the result in texcoordarray[passnum]*/
static void GenerateTCMods(const shaderpass_t *pass, int passnum)
{
#if 1
	int i, m;
	float *src;
	mesh_t *mesh;
	for (m = 0; m < shaderstate.meshcount; m++)
	{
		mesh = shaderstate.meshes[m];

		src = tcgen(pass->tcgen, mesh->numvertexes, texcoordarray[passnum]+mesh->vbofirstvert*2, mesh);
		//tcgen might return unmodified info
		if (pass->numtcmods)
		{
			/*the first tcmod reads whatever tcgen returned; the later ones work in place on the scratch array*/
			tcmod(&pass->tcmods[0], mesh->numvertexes, src, texcoordarray[passnum]+mesh->vbofirstvert*2, mesh);
			for (i = 1; i < pass->numtcmods; i++)
			{
				tcmod(&pass->tcmods[i], mesh->numvertexes, texcoordarray[passnum]+mesh->vbofirstvert*2, texcoordarray[passnum]+mesh->vbofirstvert*2, mesh);
			}
			src =
texcoordarray[passnum]+mesh->vbofirstvert*2;
		}
		else if (src != texcoordarray[passnum]+mesh->vbofirstvert*2)
		{
			//this shouldn't actually ever be true
			/*NOTE(review): tcgen() hands back the mesh's own arrays for its non-generated modes, so this copy looks reachable despite the remark above - confirm.
			  8 is the size in bytes of one pair of floats*/
			memcpy(texcoordarray[passnum]+mesh->vbofirstvert*2, src, 8*mesh->numvertexes);
		}
	}
	/*two components per coord, no vbo, client-side pointer*/
	shaderstate.pendingtexcoordparts[passnum] = 2;
	shaderstate.pendingtexcoordvbo[passnum] = 0;
	shaderstate.pendingtexcoordpointer[passnum] = texcoordarray[passnum];
#else
	/*disabled vbo-streaming variant. it refers to 'meshlist' and an older tcgen() signature, so it no longer matches the code above*/
	GL_DeselectVAO();
	if (!shaderstate.vbo_texcoords[passnum])
	{
		shaderstate.vbo_texcoords[passnum] = 0;
		qglGenBuffersARB(1, &shaderstate.vbo_texcoords[passnum]);
	}
	GL_SelectVBO(shaderstate.vbo_texcoords[passnum]);

	{
		qglBufferDataARB(GL_ARRAY_BUFFER_ARB, MAX_ARRAY_VERTS*sizeof(float)*2, NULL, GL_STREAM_DRAW_ARB);
		for (; meshlist; meshlist = meshlist->next)
		{
			int i;
			float *src;
			src = tcgen(pass, meshlist->numvertexes, texcoordarray[passnum], meshlist);
			//tcgen might return unmodified info
			if (pass->numtcmods)
			{
				tcmod(&pass->tcmods[0], meshlist->numvertexes, src, texcoordarray[passnum], meshlist);
				for (i = 1; i < pass->numtcmods; i++)
				{
					tcmod(&pass->tcmods[i], meshlist->numvertexes, texcoordarray[passnum], texcoordarray[passnum], meshlist);
				}
				src = texcoordarray[passnum];
			}
			qglBufferSubDataARB(GL_ARRAY_BUFFER_ARB, meshlist->vbofirstvert*8, meshlist->numvertexes*8, src);
		}
	}
	shaderstate.pendingtexcoordparts[passnum] = 2;
	shaderstate.pendingtexcoordvbo[passnum] = shaderstate.vbo_texcoords[passnum];
	shaderstate.pendingtexcoordpointer[passnum] = NULL;
#endif
}

//end texture coords

/*========================================== colour generation =====================================*/

//source is always packed
//dest is packed too
/*
Fills the rgb components (indices 0..2) of cnt entries of dst according to pass->rgbgen; the fourth component is not written here.
src:	per-vertex source colours, used by the vertex modes.
mesh:	supplies positions and normals for the diffuse lighting mode.
The loops count cnt down to zero, so entries are written from the last to the first.
*/
static void colourgen(const shaderpass_t *pass, int cnt, vec4_t *src, vec4_t *dst, const mesh_t *mesh)
{
	switch (pass->rgbgen)
	{
	case RGB_GEN_ENTITY:
		while((cnt)--)
		{
			dst[cnt][0] = shaderstate.curentity->shaderRGBAf[0];
			dst[cnt][1] = shaderstate.curentity->shaderRGBAf[1];
			dst[cnt][2] = shaderstate.curentity->shaderRGBAf[2];
		}
		break;
	case
RGB_GEN_ONE_MINUS_ENTITY: while((cnt)--) { dst[cnt][0] = 1-shaderstate.curentity->shaderRGBAf[0]; dst[cnt][1] = 1-shaderstate.curentity->shaderRGBAf[1]; dst[cnt][2] = 1-shaderstate.curentity->shaderRGBAf[2]; } break; case RGB_GEN_VERTEX_LIGHTING: if (shaderstate.identitylighting != 1) { if (!src) { while((cnt)--) { dst[cnt][0] = shaderstate.identitylighting; dst[cnt][1] = shaderstate.identitylighting; dst[cnt][2] = shaderstate.identitylighting; } break; } while((cnt)--) { dst[cnt][0] = src[cnt][0]*shaderstate.identitylighting; dst[cnt][1] = src[cnt][1]*shaderstate.identitylighting; dst[cnt][2] = src[cnt][2]*shaderstate.identitylighting; } break; } case RGB_GEN_VERTEX_EXACT: if (!src) { while((cnt)--) { dst[cnt][0] = 1; dst[cnt][1] = 1; dst[cnt][2] = 1; } break; } while((cnt)--) { dst[cnt][0] = src[cnt][0]; dst[cnt][1] = src[cnt][1]; dst[cnt][2] = src[cnt][2]; } break; case RGB_GEN_ONE_MINUS_VERTEX: while((cnt)--) { dst[cnt][0] = 1-src[cnt][0]; dst[cnt][1] = 1-src[cnt][1]; dst[cnt][2] = 1-src[cnt][2]; } break; case RGB_GEN_IDENTITY_LIGHTING: if (shaderstate.curbatch->lightstyle[0] != 255) { while((cnt)--) { dst[cnt][0] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[0]]/256.0f; dst[cnt][1] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[0]]/256.0f; dst[cnt][2] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[0]]/256.0f; } } else { //compensate for overbrights while((cnt)--) { dst[cnt][0] = shaderstate.identitylighting; dst[cnt][1] = shaderstate.identitylighting; dst[cnt][2] = shaderstate.identitylighting; } } break; default: case RGB_GEN_IDENTITY: while((cnt)--) { dst[cnt][0] = 1; dst[cnt][1] = 1; dst[cnt][2] = 1; } break; case RGB_GEN_CONST: while((cnt)--) { dst[cnt][0] = pass->rgbgen_func.args[0]; dst[cnt][1] = pass->rgbgen_func.args[1]; dst[cnt][2] = pass->rgbgen_func.args[2]; } break; case RGB_GEN_LIGHTING_DIFFUSE: //collect lighting details for mobile 
entities if (!mesh->normals_array) { while((cnt)--) { dst[cnt][0] = 1; dst[cnt][1] = 1; dst[cnt][2] = 1; } } else { R_LightArrays(shaderstate.curentity, mesh->xyz_array, dst, cnt, mesh->normals_array, shaderstate.identitylighting); } break; case RGB_GEN_WAVE: { float *table; float c; table = FTableForFunc(pass->rgbgen_func.type); c = pass->rgbgen_func.args[2] + shaderstate.curtime * pass->rgbgen_func.args[3]; c = FTABLE_EVALUATE(table, c) * pass->rgbgen_func.args[1] + pass->rgbgen_func.args[0]; c = bound(0.0f, c, 1.0f); while((cnt)--) { dst[cnt][0] = c; dst[cnt][1] = c; dst[cnt][2] = c; } } break; case RGB_GEN_TOPCOLOR: if (cnt) { int r, g, b; R_FetchTopColour(&r, &g, &b); dst[0][0] = r/255.0f; dst[0][1] = g/255.0f; dst[0][2] = b/255.0f; while((cnt)--) { dst[cnt][0] = dst[0][0]; dst[cnt][1] = dst[0][1]; dst[cnt][2] = dst[0][2]; } } break; case RGB_GEN_BOTTOMCOLOR: if (cnt) { int r, g, b; R_FetchBottomColour(&r, &g, &b); dst[0][0] = r/255.0f; dst[0][1] = g/255.0f; dst[0][2] = b/255.0f; while((cnt)--) { dst[cnt][0] = dst[0][0]; dst[cnt][1] = dst[0][1]; dst[cnt][2] = dst[0][2]; } } break; } } static void deformgen(const deformv_t *deformv, int cnt, vecV_t *src, vecV_t *dst, const mesh_t *mesh) { float *table; int j, k; float args[4]; float deflect; switch (deformv->type) { default: case DEFORMV_NONE: if (src != dst) memcpy(dst, src, sizeof(*src)*cnt); break; case DEFORMV_WAVE: if (!mesh->normals_array) { if (src != dst) memcpy(dst, src, sizeof(*src)*cnt); return; } args[0] = deformv->func.args[0]; args[1] = deformv->func.args[1]; args[3] = deformv->func.args[2] + deformv->func.args[3] * shaderstate.curtime; table = FTableForFunc(deformv->func.type); for ( j = 0; j < cnt; j++ ) { deflect = deformv->args[0] * (src[j][0]+src[j][1]+src[j][2]) + args[3]; deflect = FTABLE_EVALUATE(table, deflect) * args[1] + args[0]; // Deflect vertex along its normal by wave amount VectorMA(src[j], deflect, mesh->normals_array[j], dst[j]); } break; case DEFORMV_NORMAL: //normal does not 
actually move the verts, but it does change the normals array //we don't currently support that. if (src != dst) memcpy(dst, src, sizeof(*src)*cnt); /* args[0] = deformv->args[1] * shaderstate.curtime; for ( j = 0; j < cnt; j++ ) { args[1] = normalsArray[j][2] * args[0]; deflect = deformv->args[0] * R_FastSin(args[1]); normalsArray[j][0] *= deflect; deflect = deformv->args[0] * R_FastSin(args[1] + 0.25); normalsArray[j][1] *= deflect; VectorNormalizeFast(normalsArray[j]); } */ break; case DEFORMV_MOVE: table = FTableForFunc(deformv->func.type); deflect = deformv->func.args[2] + shaderstate.curtime * deformv->func.args[3]; deflect = FTABLE_EVALUATE(table, deflect) * deformv->func.args[1] + deformv->func.args[0]; for ( j = 0; j < cnt; j++ ) VectorMA(src[j], deflect, deformv->args, dst[j]); break; case DEFORMV_BULGE: args[0] = deformv->args[0]/(2*M_PI); args[1] = deformv->args[1]; args[2] = shaderstate.curtime * deformv->args[2]/(2*M_PI); for (j = 0; j < cnt; j++) { deflect = R_FastSin(mesh->st_array[j][0]*args[0] + args[2])*args[1]; dst[j][0] = src[j][0]+deflect*mesh->normals_array[j][0]; dst[j][1] = src[j][1]+deflect*mesh->normals_array[j][1]; dst[j][2] = src[j][2]+deflect*mesh->normals_array[j][2]; } break; case DEFORMV_AUTOSPRITE: if (mesh->numindexes < 6) break; for (j = 0; j < cnt-3; j+=4, src+=4, dst+=4) { vec3_t mid, d; float radius; mid[0] = 0.25*(src[0][0] + src[1][0] + src[2][0] + src[3][0]); mid[1] = 0.25*(src[0][1] + src[1][1] + src[2][1] + src[3][1]); mid[2] = 0.25*(src[0][2] + src[1][2] + src[2][2] + src[3][2]); VectorSubtract(src[0], mid, d); radius = 2*VectorLength(d); for (k = 0; k < 4; k++) { dst[k][0] = mid[0] + radius*((mesh->st_array[k][0]-0.5)*r_refdef.m_view[0+0]-(mesh->st_array[k][1]-0.5)*r_refdef.m_view[0+1]); dst[k][1] = mid[1] + radius*((mesh->st_array[k][0]-0.5)*r_refdef.m_view[4+0]-(mesh->st_array[k][1]-0.5)*r_refdef.m_view[4+1]); dst[k][2] = mid[2] + 
radius*((mesh->st_array[k][0]-0.5)*r_refdef.m_view[8+0]-(mesh->st_array[k][1]-0.5)*r_refdef.m_view[8+1]); } } break; case DEFORMV_AUTOSPRITE2: if (mesh->numindexes < 6) break; for (k = 0; k < mesh->numindexes; k += 6) { int long_axis, short_axis; vec3_t axis; float len[3]; mat3_t m0, m1, m2, result; float *quad[4]; vec3_t rot_centre, tv; quad[0] = (float *)(dst + mesh->indexes[k+0]); quad[1] = (float *)(dst + mesh->indexes[k+1]); quad[2] = (float *)(dst + mesh->indexes[k+2]); for (j = 2; j >= 0; j--) { quad[3] = (float *)(dst + mesh->indexes[k+3+j]); if (!VectorEquals (quad[3], quad[0]) && !VectorEquals (quad[3], quad[1]) && !VectorEquals (quad[3], quad[2])) { break; } } // build a matrix were the longest axis of the billboard is the Y-Axis VectorSubtract(quad[1], quad[0], m0[0]); VectorSubtract(quad[2], quad[0], m0[1]); VectorSubtract(quad[2], quad[1], m0[2]); len[0] = DotProduct(m0[0], m0[0]); len[1] = DotProduct(m0[1], m0[1]); len[2] = DotProduct(m0[2], m0[2]); if ((len[2] > len[1]) && (len[2] > len[0])) { if (len[1] > len[0]) { long_axis = 1; short_axis = 0; } else { long_axis = 0; short_axis = 1; } } else if ((len[1] > len[2]) && (len[1] > len[0])) { if (len[2] > len[0]) { long_axis = 2; short_axis = 0; } else { long_axis = 0; short_axis = 2; } } else //if ( (len[0] > len[1]) && (len[0] > len[2]) ) { if (len[2] > len[1]) { long_axis = 2; short_axis = 1; } else { long_axis = 1; short_axis = 2; } } if (DotProduct(m0[long_axis], m0[short_axis])) { VectorNormalize2(m0[long_axis], axis); VectorCopy(axis, m0[1]); if (axis[0] || axis[1]) { VectorVectors(m0[1], m0[2], m0[0]); } else { VectorVectors(m0[1], m0[0], m0[2]); } } else { VectorNormalize2(m0[long_axis], axis); VectorNormalize2(m0[short_axis], m0[0]); VectorCopy(axis, m0[1]); CrossProduct(m0[0], m0[1], m0[2]); } for (j = 0; j < 3; j++) rot_centre[j] = (quad[0][j] + quad[1][j] + quad[2][j] + quad[3][j]) * 0.25; if (shaderstate.curentity) { VectorAdd(shaderstate.curentity->origin, rot_centre, tv); } else { 
VectorCopy(rot_centre, tv); } VectorSubtract(r_origin, tv, tv); // filter any longest-axis-parts off the camera-direction deflect = -DotProduct(tv, axis); VectorMA(tv, deflect, axis, m1[2]); VectorNormalizeFast(m1[2]); VectorCopy(axis, m1[1]); CrossProduct(m1[1], m1[2], m1[0]); Matrix3_Transpose(m1, m2); Matrix3_Multiply(m2, m0, result); for (j = 0; j < 4; j++) { VectorSubtract(quad[j], rot_centre, tv); Matrix3_Multiply_Vec3(result, tv, quad[j]); VectorAdd(rot_centre, quad[j], quad[j]); } } break; // case DEFORMV_PROJECTION_SHADOW: // break; } } static void GenerateVertexBlends(const shader_t *shader) { int i, m; mesh_t *meshlist; vecV_t *ov, *iv1, *iv2; float w1, w2; for (m = 0; m < shaderstate.meshcount; m++) { meshlist = shaderstate.meshes[m]; ov = vertexarray+meshlist->vbofirstvert; iv1 = meshlist->xyz_array; iv2 = meshlist->xyz2_array; w1 = meshlist->xyz_blendw[0]; w2 = meshlist->xyz_blendw[1]; for (i = 0; i < meshlist->numvertexes; i++) { ov[i][0] = iv1[i][0]*w1 + iv2[i][0]*w2; ov[i][1] = iv1[i][1]*w1 + iv2[i][1]*w2; ov[i][2] = iv1[i][2]*w1 + iv2[i][2]*w2; } for (i = 0; i < shader->numdeforms; i++) { deformgen(&shader->deforms[i], meshlist->numvertexes, vertexarray+meshlist->vbofirstvert, vertexarray+meshlist->vbofirstvert, meshlist); } } shaderstate.pendingvertexpointer = vertexarray; shaderstate.pendingvertexvbo = 0; } static void GenerateVertexDeforms(const shader_t *shader) { int i, m; mesh_t *meshlist; for (m = 0; m < shaderstate.meshcount; m++) { meshlist = shaderstate.meshes[m]; deformgen(&shader->deforms[0], meshlist->numvertexes, meshlist->xyz_array, vertexarray+meshlist->vbofirstvert, meshlist); for (i = 1; i < shader->numdeforms; i++) { deformgen(&shader->deforms[i], meshlist->numvertexes, vertexarray+meshlist->vbofirstvert, vertexarray+meshlist->vbofirstvert, meshlist); } } shaderstate.pendingvertexpointer = vertexarray; shaderstate.pendingvertexvbo = 0; } /*======================================alpha ===============================*/ static void 
alphagen(const shaderpass_t *pass, int cnt, avec4_t *const src, avec4_t *dst, const mesh_t *mesh)
{
	/*
	Writes the alpha channel (index 3) of 'cnt' colours in 'dst' according to pass->alphagen.
	The RGB channels are not touched.
	  src  - per-vertex source colours; may be NULL, in which case ALPHA_GEN_VERTEX writes 1.
	  mesh - read by ALPHA_GEN_PORTAL (xyz_array[0]) and ALPHA_GEN_SPECULAR (xyz_array, normals_array).
	*/
	float *table;
	float t;
	float f;
	vec3_t v1, v2;
	int i;

	switch (pass->alphagen)
	{
	default:
	case ALPHA_GEN_IDENTITY:
		if (shaderstate.flags & BEF_FORCETRANSPARENT)
		{
			//forced transparency takes the entity's alpha instead of 1
			while(cnt--)
				dst[cnt][3] = shaderstate.curentity->shaderRGBAf[3];
		}
		else
		{
			while(cnt--)
				dst[cnt][3] = 1;
		}
		break;

	case ALPHA_GEN_CONST:
		t = pass->alphagen_func.args[0];
		while(cnt--)
			dst[cnt][3] = t;
		break;

	case ALPHA_GEN_WAVE:
		table = FTableForFunc(pass->alphagen_func.type);
		f = pass->alphagen_func.args[2] + shaderstate.curtime * pass->alphagen_func.args[3];
		f = FTABLE_EVALUATE(table, f) * pass->alphagen_func.args[1] + pass->alphagen_func.args[0];
		t = bound(0.0f, f, 1.0f);
		while(cnt--)
			dst[cnt][3] = t;
		break;

	case ALPHA_GEN_PORTAL:
		//FIXME: should this be per-vert?
		if (r_refdef.recurse)
			f = 1;
		else
		{
			//alpha is the distance from the view origin to the mesh's first vertex, relative to portaldist, clamped to 0..1
			VectorAdd(mesh->xyz_array[0], shaderstate.curentity->origin, v1);
			VectorSubtract(r_origin, v1, v2);
			f = VectorLength(v2) * (1.0 / shaderstate.curshader->portaldist);
			f = bound(0.0f, f, 1.0f);
		}

		while(cnt--)
			dst[cnt][3] = f;
		break;

	case ALPHA_GEN_VERTEX:
		if (!src)
		{
			while(cnt--)
			{
				dst[cnt][3] = 1;
			}
			break;
		}

		while(cnt--)
		{
			dst[cnt][3] = src[cnt][3];
		}
		break;

	case ALPHA_GEN_ENTITY:
		f = bound(0, shaderstate.curentity->shaderRGBAf[3], 1);
		while(cnt--)
		{
			dst[cnt][3] = f;
		}
		break;

	case ALPHA_GEN_SPECULAR:
		{
			mat3_t axis;
			AngleVectors(shaderstate.curentity->angles, axis[0], axis[1], axis[2]);
			VectorSubtract(r_origin, shaderstate.curentity->origin, v1);

			//v2 ends up as the view origin relative to the entity, rotated by the entity's axes unless they are the default
			if (!Matrix3_Compare(axis, axisDefault))
			{
				Matrix3_Multiply_Vec3(axis, v1, v2);
			}
			else
			{
				VectorCopy(v1, v2);
			}

			for (i = 0; i < cnt; i++)
			{
				VectorSubtract(v2, mesh->xyz_array[i], v1);
				//dot of the normal with the normalised vertex-to-eye vector, raised to the 5th power
				f = DotProduct(v1, mesh->normals_array[i] ) * Q_rsqrt(DotProduct(v1,v1));
				f = f * f * f * f * f;
				dst[i][3] = bound (0.0f, f, 1.0f);
			}
		}
		break;
	}
}

/*
GenerateColourMods: decides where the colour stream for 'pass' comes from and records it in shaderstate:
  - a single flat colour in shaderstate.pendingcolourflat (pendingcolourpointer NULL, pendingcolourvbo 0),
  - the source vbo's own colour array, or
  - per-vertex colours generated into coloursarray for every mesh in shaderstate.meshes.
*/
static void GenerateColourMods(const shaderpass_t *pass)
{
	unsigned int m;
	mesh_t *meshlist;
	meshlist = shaderstate.meshes[0];

	if (pass->flags & SHADER_PASS_NOCOLORARRAY && qglColor4fv)
	{
		//the pass does not need a colour array: evaluate the gens once into the flat colour
		colourgen(pass, 1, meshlist->colors4f_array, &shaderstate.pendingcolourflat, meshlist);
		alphagen(pass, 1, meshlist->colors4f_array, &shaderstate.pendingcolourflat, meshlist);
		shaderstate.pendingcolourvbo = 0;
		shaderstate.pendingcolourpointer = NULL;
	}
	else
	{
		extern cvar_t r_nolightdir;
		if (pass->rgbgen == RGB_GEN_LIGHTING_DIFFUSE)
		{
			if (shaderstate.mode == BEM_DEPTHDARK || shaderstate.mode == BEM_DEPTHONLY)
			{
				//these modes draw diffuse-lit surfaces as flat black
				shaderstate.pendingcolourflat[0] = shaderstate.pendingcolourflat[1] = shaderstate.pendingcolourflat[2] = 0;
				alphagen(pass, 1, meshlist->colors4f_array, &shaderstate.pendingcolourflat, meshlist);
				shaderstate.pendingcolourvbo = 0;
				shaderstate.pendingcolourpointer = NULL;
				return;
			}
			if (shaderstate.mode == BEM_LIGHT)
			{
				//light mode draws diffuse-lit surfaces as flat white
				shaderstate.pendingcolourflat[0] = shaderstate.pendingcolourflat[1] = shaderstate.pendingcolourflat[2] = 1;
				alphagen(pass, 1, meshlist->colors4f_array, &shaderstate.pendingcolourflat, meshlist);
				shaderstate.pendingcolourvbo = 0;
				shaderstate.pendingcolourpointer = NULL;
				return;
			}
			if (r_nolightdir.ival)
			{
				//no directional lighting: flat colour from the entity's average light and alpha
				VectorCopy(shaderstate.curentity->light_avg, shaderstate.pendingcolourflat);
				shaderstate.pendingcolourflat[3] = shaderstate.curentity->shaderRGBAf[3];
				shaderstate.pendingcolourvbo = 0;
				shaderstate.pendingcolourpointer = NULL;
				return;
			}
		}

		//if its vertex lighting, just use the vbo
		if (((pass->rgbgen == RGB_GEN_VERTEX_LIGHTING && shaderstate.identitylighting == 1) ||
			pass->rgbgen == RGB_GEN_VERTEX_EXACT) &&
			pass->alphagen == ALPHA_GEN_VERTEX)
		{
			shaderstate.pendingcolourvbo = shaderstate.sourcevbo->colours.gl.vbo;
			shaderstate.pendingcolourpointer = shaderstate.sourcevbo->colours.gl.addr;
			return;
		}

		//otherwise generate rgb then alpha for every vertex of every mesh
		for (m = 0; m < shaderstate.meshcount; m++)
		{
			meshlist = shaderstate.meshes[m];

			colourgen(pass, meshlist->numvertexes, meshlist->colors4f_array, coloursarray + meshlist->vbofirstvert, meshlist);
			alphagen(pass, meshlist->numvertexes, meshlist->colors4f_array, coloursarray + meshlist->vbofirstvert, meshlist);
		}
		shaderstate.colourarraytype = GL_FLOAT;
		shaderstate.pendingcolourvbo = 0;
		shaderstate.pendingcolourpointer = coloursarray;
	}
}

/*
BE_GeneratePassTC: selects the texture coordinate source for texture unit 'tmu'.
When the pass has no tcmods and its tcgen maps directly onto an array of shaderstate.sourcevbo,
the pending texcoord vbo/pointer/component-count are pointed at that array.
Anything else is handed to GenerateTCMods.
*/
static void BE_GeneratePassTC(const shaderpass_t *pass, int tmu)
{
	if (!pass->numtcmods)
	{
		//if there are no tcmods, pass through here as fast as possible
		if (pass->tcgen == TC_GEN_BASE)
		{
			shaderstate.pendingtexcoordparts[tmu] = 2;
			shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->texcoord.gl.vbo;
			shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->texcoord.gl.addr;
		}
		else if (pass->tcgen == TC_GEN_LIGHTMAP)
		{
			if (!shaderstate.sourcevbo->lmcoord[0].gl.addr)
			{
				//no lightmap coords available: use the base texcoords instead
				shaderstate.pendingtexcoordparts[tmu] = 2;
				shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->texcoord.gl.vbo;
				shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->texcoord.gl.addr;
			}
			else
			{
				shaderstate.pendingtexcoordparts[tmu] = 2;
				shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->lmcoord[0].gl.vbo;
				shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->lmcoord[0].gl.addr;
			}
		}
		else if (pass->tcgen == TC_GEN_NORMAL)
		{
			//the vector arrays are fed through as 3-component texcoords
			shaderstate.pendingtexcoordparts[tmu] = 3;
			shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->normals.gl.vbo;
			shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->normals.gl.addr;
		}
		else if (pass->tcgen == TC_GEN_SVECTOR)
		{
			shaderstate.pendingtexcoordparts[tmu] = 3;
			shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->svector.gl.vbo;
			shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->svector.gl.addr;
		}
		else if (pass->tcgen == TC_GEN_TVECTOR)
		{
			shaderstate.pendingtexcoordparts[tmu] = 3;
			shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->tvector.gl.vbo;
			shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->tvector.gl.addr;
		}
		else
		{
			//specular highlights and reflections have no fixed data, and must be generated.
			GenerateTCMods(pass, tmu);
		}
	}
	else
	{
		GenerateTCMods(pass, tmu);
	}
}

/*
BE_SendPassBlendDepthMask: applies a pass's SBITS_* state word to GL.
The requested bits are first adjusted for 2d mode and for the BEF_FORCE* flags in shaderstate.flags.
Only the state groups whose bits differ from the cached shaderstate.shaderbits are then sent
(every group is sent when FORCESTATE is defined). The cache is updated to the adjusted bits.
*/
static void BE_SendPassBlendDepthMask(unsigned int sbits)
{
	unsigned int delta;

	/*2d mode doesn't depth test or depth write*/
	if (shaderstate.force2d)
	{
#ifdef warningmsg
#pragma warningmsg("fixme: q3 doesn't seem to have this, why do we need it?")
#endif
		sbits &= ~(SBITS_MISC_DEPTHWRITE|SBITS_MISC_DEPTHEQUALONLY);
		sbits |= SBITS_MISC_NODEPTHTEST;
	}
	if (shaderstate.flags & (BEF_FORCEADDITIVE|BEF_FORCETRANSPARENT|BEF_FORCENODEPTH|BEF_FORCEDEPTHTEST|BEF_FORCEDEPTHWRITE))
	{
		if (shaderstate.flags & BEF_FORCEADDITIVE)
			sbits = (sbits & ~(SBITS_MISC_DEPTHWRITE|SBITS_BLEND_BITS|SBITS_ATEST_BITS))
						| (SBITS_SRCBLEND_SRC_ALPHA | SBITS_DSTBLEND_ONE);
		else if (shaderstate.flags & BEF_FORCETRANSPARENT)
		{
			//only opaque passes (no blend bits, or ONE/ZERO) are switched to alpha blending
			if ((sbits & SBITS_BLEND_BITS) == (SBITS_SRCBLEND_ONE| SBITS_DSTBLEND_ZERO) || !(sbits & SBITS_BLEND_BITS))	/*if transparency is forced, clear alpha test bits*/
				sbits = (sbits & ~(SBITS_BLEND_BITS|SBITS_ATEST_BITS))
							| (SBITS_SRCBLEND_SRC_ALPHA | SBITS_DSTBLEND_ONE_MINUS_SRC_ALPHA | SBITS_ATEST_GT0);
		}

		if (shaderstate.flags & BEF_FORCENODEPTH)	/*EF_NODEPTHTEST dp extension*/
			sbits |= SBITS_MISC_NODEPTHTEST;
		else
		{
			if (shaderstate.flags & BEF_FORCEDEPTHTEST)
				sbits &= ~SBITS_MISC_NODEPTHTEST;
			if (shaderstate.flags & BEF_FORCEDEPTHWRITE)
				sbits |= SBITS_MISC_DEPTHWRITE;
		}
	}

	//delta holds the bits that differ from what was last sent
	delta = sbits^shaderstate.shaderbits;

#ifdef FORCESTATE
	delta |= ~0;
#endif

	if (!delta)
		return;
	shaderstate.shaderbits = sbits;

	if (delta & SBITS_BLEND_BITS)
	{
		if (sbits & SBITS_BLEND_BITS)
		{
			int src, dst;

			/*unpack the src and dst factors*/
			switch(sbits & SBITS_SRCBLEND_BITS)
			{
			case SBITS_SRCBLEND_ZERO:					src = GL_ZERO;	break;
			default:
			case SBITS_SRCBLEND_ONE:					src = GL_ONE;	break;
			case SBITS_SRCBLEND_DST_COLOR:				src = GL_DST_COLOR;	break;
			case SBITS_SRCBLEND_ONE_MINUS_DST_COLOR:	src = GL_ONE_MINUS_DST_COLOR;	break;
			case SBITS_SRCBLEND_SRC_ALPHA:				src = GL_SRC_ALPHA;	break;
			case SBITS_SRCBLEND_ONE_MINUS_SRC_ALPHA:	src = GL_ONE_MINUS_SRC_ALPHA;	break;
			case SBITS_SRCBLEND_DST_ALPHA:				src = GL_DST_ALPHA;	break;
			case SBITS_SRCBLEND_ONE_MINUS_DST_ALPHA:	src = GL_ONE_MINUS_DST_ALPHA;	break;
			case SBITS_SRCBLEND_ALPHA_SATURATE:			src = GL_SRC_ALPHA_SATURATE;	break;
			}
			switch((sbits & SBITS_DSTBLEND_BITS)>>4)
			{
			case SBITS_DSTBLEND_ZERO>>4:				dst = GL_ZERO;	break;
			default:
			case SBITS_DSTBLEND_ONE>>4:					dst = GL_ONE;	break;
			case SBITS_DSTBLEND_SRC_COLOR>>4:			dst = GL_SRC_COLOR;	break;
			case SBITS_DSTBLEND_ONE_MINUS_SRC_COLOR>>4:	dst = GL_ONE_MINUS_SRC_COLOR;	break;
			case SBITS_DSTBLEND_SRC_ALPHA>>4:			dst = GL_SRC_ALPHA;	break;
			case SBITS_DSTBLEND_ONE_MINUS_SRC_ALPHA>>4:	dst = GL_ONE_MINUS_SRC_ALPHA;	break;
			case SBITS_DSTBLEND_DST_ALPHA>>4:			dst = GL_DST_ALPHA;	break;
			case SBITS_DSTBLEND_ONE_MINUS_DST_ALPHA>>4:	dst = GL_ONE_MINUS_DST_ALPHA;	break;
			}
			qglEnable(GL_BLEND);
			qglBlendFunc(src, dst);
		}
		else
			qglDisable(GL_BLEND);
	}

#ifdef GL_ALPHA_TEST	//alpha test doesn't exist in gles2
	if ((delta & SBITS_ATEST_BITS) && !gl_config.nofixedfunc)
	{
		switch (sbits & SBITS_ATEST_BITS)
		{
		default:
			qglDisable(GL_ALPHA_TEST);
			break;
		case SBITS_ATEST_GT0:
			qglEnable(GL_ALPHA_TEST);
			qglAlphaFunc(GL_GREATER, 0);
			break;
		case SBITS_ATEST_LT128:
			qglEnable(GL_ALPHA_TEST);
			qglAlphaFunc(GL_LESS, 0.5f);
			break;
		case SBITS_ATEST_GE128:
			qglEnable(GL_ALPHA_TEST);
			qglAlphaFunc(GL_GEQUAL, 0.5f);
			break;
		}
	}
#endif

	if (delta & SBITS_MISC_NODEPTHTEST)
	{
		if (sbits & SBITS_MISC_NODEPTHTEST)
			qglDisable(GL_DEPTH_TEST);
		else
			qglEnable(GL_DEPTH_TEST);
	}
	if (delta & SBITS_MISC_DEPTHWRITE)
	{
		if (sbits & SBITS_MISC_DEPTHWRITE)
			qglDepthMask(GL_TRUE);
		else
			qglDepthMask(GL_FALSE);
	}
	if (delta & (SBITS_MISC_DEPTHEQUALONLY|SBITS_MISC_DEPTHCLOSERONLY))
	{
		extern int gldepthfunc;
		switch (sbits & (SBITS_MISC_DEPTHEQUALONLY|SBITS_MISC_DEPTHCLOSERONLY))
		{
		case SBITS_MISC_DEPTHEQUALONLY:
			qglDepthFunc(GL_EQUAL);
			break;
		case SBITS_MISC_DEPTHCLOSERONLY:
			//the strict variant of whichever comparison direction gldepthfunc is using
			if (gldepthfunc == GL_LEQUAL)
				qglDepthFunc(GL_LESS);
			else
				qglDepthFunc(GL_GREATER);
			break;
		default:
			qglDepthFunc(gldepthfunc);
			break;
		}
	}
	if (delta & (SBITS_MASK_BITS))
	{
		//a set SBITS_MASK_* bit disables writes to that channel
		qglColorMask(
					(sbits&SBITS_MASK_RED)?GL_FALSE:GL_TRUE,
					(sbits&SBITS_MASK_GREEN)?GL_FALSE:GL_TRUE,
					(sbits&SBITS_MASK_BLUE)?GL_FALSE:GL_TRUE,
					(sbits&SBITS_MASK_ALPHA)?GL_FALSE:GL_TRUE
					);
	}
	if ((delta & SBITS_TRUFORM) && qglPNTrianglesiATI)
	{
		if ((sbits & SBITS_TRUFORM) && gl_ati_truform.ival)
			qglEnable(GL_PN_TRIANGLES_ATI);
		else
			qglDisable(GL_PN_TRIANGLES_ATI);
	}
}

/*
BE_SubmitMeshChain: issues the draw calls for the meshes in shaderstate.meshes, indexing through
shaderstate.sourcevbo's index data. Meshes whose index ranges follow on from each other are merged
into a single qglDrawRangeElements call. Lines are drawn when BEF_LINES is set, triangles otherwise.
*/
static void BE_SubmitMeshChain(void)
{
	int startv, starti, endv, endi;
	int m;
	mesh_t *mesh;
	int batchtype = GL_TRIANGLES;

	if (shaderstate.flags & BEF_LINES)
		batchtype = GL_LINES;

	//disabled path: draws from client-side index lists when no element buffer is bound
#if 0
	if (!shaderstate.currentebo)
	{
		if (shaderstate.meshcount == 1)
		{
			mesh = shaderstate.meshes[0];
			qglDrawRangeElements(batchtype, mesh->vbofirstvert, mesh->vbofirstvert+mesh->numvertexes, mesh->numindexes, GL_INDEX_TYPE, shaderstate.sourcevbo->indicies + mesh->vbofirstelement);
			RQuantAdd(RQUANT_DRAWS, 1);
			return;
		}
		else
		{
			index_t *ilst;
			mesh = shaderstate.meshes[0];
			startv = mesh->vbofirstvert;
			endv = startv + mesh->numvertexes;
			endi = mesh->numindexes;
			for (m = 1; m < shaderstate.meshcount; m++)
			{
				mesh = shaderstate.meshes[m];
				endi += mesh->numindexes;

				if (startv > mesh->vbofirstvert)
					startv = mesh->vbofirstvert;
				if (endv < mesh->vbofirstvert+mesh->numvertexes)
					endv = mesh->vbofirstvert+mesh->numvertexes;
			}

			ilst = alloca(endi*sizeof(index_t));
			endi = 0;
			for (m = 0; m < shaderstate.meshcount; m++)
			{
				mesh = shaderstate.meshes[m];
				for (starti = 0; starti < mesh->numindexes; )
					ilst[endi++] = mesh->vbofirstvert + mesh->indexes[starti++];
			}
			qglDrawRangeElements(batchtype, startv, endv, endi, GL_INDEX_TYPE, ilst);
			RQuantAdd(RQUANT_DRAWS, 1);
		}
		return;
	}
#endif

/*
	if (qglLockArraysEXT)
	{
		endv = 0;
		startv = 0x7fffffff;
		for (m = 0; m < shaderstate.meshcount; m++)
		{
			mesh = shaderstate.meshes[m];
			starti = mesh->vbofirstvert;
			if (starti < startv)
				startv = starti;
			endi = mesh->vbofirstvert+mesh->numvertexes;
			if (endi > endv)
				endv = endi;
		}
		qglLockArraysEXT(startv, endv);
	}
*/

	for (m = 0, mesh =
shaderstate.meshes[0]; m < shaderstate.meshcount; ) { startv = mesh->vbofirstvert; starti = mesh->vbofirstelement; endv = startv+mesh->numvertexes; endi = starti+mesh->numindexes; //find consecutive surfaces for (++m; m < shaderstate.meshcount; m++) { mesh = shaderstate.meshes[m]; if (endi == mesh->vbofirstelement) { endv = mesh->vbofirstvert+mesh->numvertexes; endi = mesh->vbofirstelement+mesh->numindexes; } else { break; } } qglDrawRangeElements(batchtype, startv, endv, endi-starti, GL_INDEX_TYPE, (index_t*)shaderstate.sourcevbo->indicies.gl.addr + starti); RQuantAdd(RQUANT_DRAWS, 1); } /* if (qglUnlockArraysEXT) qglUnlockArraysEXT(); */ } static void DrawPass(const shaderpass_t *pass) { int i, j, k; int tmu; int lastpass = pass->numMergedPasses; unsigned int attr = (1u<upperoverlay)) continue; if (pass[i].texgen == T_GEN_LOWEROVERLAY && !TEXVALID(shaderstate.curtexnums->loweroverlay)) continue; if (pass[i].texgen == T_GEN_FULLBRIGHT && !TEXVALID(shaderstate.curtexnums->fullbright)) continue; break; } if (i == lastpass) return; BE_SendPassBlendDepthMask(pass[i].shaderbits); GenerateColourMods(pass+i); tmu = 0; for (; i < lastpass; i++) { if (pass[i].texgen == T_GEN_UPPEROVERLAY && !TEXVALID(shaderstate.curtexnums->upperoverlay)) continue; if (pass[i].texgen == T_GEN_LOWEROVERLAY && !TEXVALID(shaderstate.curtexnums->loweroverlay)) continue; if (pass[i].texgen == T_GEN_FULLBRIGHT && !TEXVALID(shaderstate.curtexnums->fullbright)) continue; Shader_BindTextureForPass(tmu, pass+i); attr |= (1u<<(VATTR_LEG_TMU0+tmu)); BE_GeneratePassTC(pass+i, tmu); BE_SetPassBlendMode(tmu, pass[i].blendmode); tmu++; //add in if (pass[i].texgen == T_GEN_LIGHTMAP) { //first pass should have been REPLACE //second pass should be an ADD //this depends upon rgbgens for light levels, so each pass *must* be pushed to hardware individually for (j = 1; j < MAXLIGHTMAPS && shaderstate.curbatch->lightmap[j] >= 0; j++) { if (j == 1) BE_SetPassBlendMode(tmu, PBM_REPLACE); /*make sure no textures 
linger*/ for (k = tmu; k < shaderstate.lastpasstmus; k++) { GL_LazyBind(k, 0, r_nulltex); } shaderstate.lastpasstmus = tmu; /*push it*/ BE_EnableShaderAttributes(attr, 0); BE_SubmitMeshChain(); tmu = 0; /*bind the light texture*/ GL_LazyBind(tmu, GL_TEXTURE_2D, lightmap[shaderstate.curbatch->lightmap[j]]->lightmap_texture); /*set up the colourmod for this style's lighting*/ shaderstate.pendingcolourvbo = 0; shaderstate.pendingcolourpointer = NULL; shaderstate.pendingcolourflat[0] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[j]]/256.0f; shaderstate.pendingcolourflat[1] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[j]]/256.0f; shaderstate.pendingcolourflat[2] = shaderstate.identitylighting * d_lightstylevalue[shaderstate.curbatch->lightstyle[j]]/256.0f; shaderstate.pendingcolourflat[3] = 1; /*pick the correct st coords for this lightmap pass*/ shaderstate.pendingtexcoordparts[tmu] = 2; shaderstate.pendingtexcoordvbo[tmu] = shaderstate.sourcevbo->lmcoord[j].gl.vbo; shaderstate.pendingtexcoordpointer[tmu] = shaderstate.sourcevbo->lmcoord[j].gl.addr; BE_SetPassBlendMode(tmu, PBM_ADD); BE_SendPassBlendDepthMask((pass[0].shaderbits & ~SBITS_BLEND_BITS) | SBITS_SRCBLEND_ONE | SBITS_DSTBLEND_ONE); attr = (1u< 1 && i != lastpass) { for (k = tmu; k < shaderstate.lastpasstmus; k++) { GL_LazyBind(k, 0, r_nulltex); } shaderstate.lastpasstmus = tmu; BE_EnableShaderAttributes(attr, 0); BE_SubmitMeshChain(); tmu = 0; BE_SendPassBlendDepthMask(pass[i+1].shaderbits); GenerateColourMods(&pass[i+1]); } } } if (!tmu) return; for (i = tmu; i < shaderstate.lastpasstmus; i++) { GL_LazyBind(i, 0, r_nulltex); } shaderstate.lastpasstmus = tmu; BE_EnableShaderAttributes(attr, 0); BE_SubmitMeshChain(); } static void BE_Program_Set_Attributes(const program_t *prog, unsigned int perm, qboolean entunchanged) { vec4_t param4; int r, g, b; int i; unsigned int ph; const shaderprogparm_t *p; /*don't bother setting it if the 
ent properties are unchanged (but do if the mesh changed)*/ if (entunchanged) return; for (i = 0; i < prog->numparams; i++) { p = &prog->parm[i]; ph = prog->permu[perm].parm[i]; if (ph == -1) continue; /*not in this permutation*/ switch(p->type) { case SP_M_VIEW: qglUniformMatrix4fvARB(ph, 1, false, r_refdef.m_view); break; case SP_M_PROJECTION: qglUniformMatrix4fvARB(ph, 1, false, r_refdef.m_projection); break; case SP_M_MODELVIEW: qglUniformMatrix4fvARB(ph, 1, false, shaderstate.modelviewmatrix); break; case SP_M_MODELVIEWPROJECTION: { float m16[16]; Matrix4_Multiply(r_refdef.m_projection, shaderstate.modelviewmatrix, m16); qglUniformMatrix4fvARB(ph, 1, false, m16); } break; case SP_M_INVMODELVIEWPROJECTION: { float m16[16], inv[16]; Matrix4_Multiply(r_refdef.m_projection, shaderstate.modelviewmatrix, m16); Matrix4_Invert(m16, inv); qglUniformMatrix4fvARB(ph, 1, false, inv); } break; case SP_M_MODEL: qglUniformMatrix4fvARB(ph, 1, false, shaderstate.modelmatrix); break; case SP_M_ENTBONES: { qglUniformMatrix3x4fv(ph, shaderstate.sourcevbo->numbones, false, shaderstate.sourcevbo->bones); } break; case SP_M_INVVIEWPROJECTION: { float m16[16], inv[16]; Matrix4_Multiply(r_refdef.m_projection, r_refdef.m_view, m16); Matrix4_Invert(m16, inv); qglUniformMatrix4fvARB(ph, 1, false, inv); } break; case SP_E_VBLEND: qglUniform2fvARB(ph, 1, shaderstate.meshes[0]->xyz_blendw); break; case SP_E_LMSCALE: if (perm & PERMUTATION_LIGHTSTYLES) { vec4_t colscale[MAXLIGHTMAPS]; int j, s; for (j = 0; j < MAXLIGHTMAPS ; j++) { s = shaderstate.curbatch->lightstyle[j]; if (s == 255) { for (; j < MAXLIGHTMAPS ; j++) { colscale[j][0] = 0; colscale[j][1] = 0; colscale[j][2] = 0; colscale[j][3] = 1; } break; } if (shaderstate.curentity->model && shaderstate.curentity->model->engineflags & MDLF_NEEDOVERBRIGHT) { float sc = (1<model && shaderstate.curentity->model->engineflags & MDLF_NEEDOVERBRIGHT) { float sc = (1<glowmod); break; case SP_E_ORIGIN: qglUniform3fvARB(ph, 1, 
(GLfloat*)shaderstate.curentity->origin); break; case SP_E_COLOURS: qglUniform4fvARB(ph, 1, (GLfloat*)shaderstate.curentity->shaderRGBAf); break; case SP_E_COLOURSIDENT: if (shaderstate.flags & BEF_FORCECOLOURMOD) qglUniform4fvARB(ph, 1, (GLfloat*)shaderstate.curentity->shaderRGBAf); else qglUniform4fARB(ph, 1, 1, 1, shaderstate.curentity->shaderRGBAf[3]); break; case SP_E_TOPCOLOURS: R_FetchTopColour(&r, &g, &b); param4[0] = r/255.0f; param4[1] = g/255.0f; param4[2] = b/255.0f; qglUniform3fvARB(ph, 1, param4); break; case SP_E_BOTTOMCOLOURS: R_FetchBottomColour(&r, &g, &b); param4[0] = r/255.0f; param4[1] = g/255.0f; param4[2] = b/255.0f; qglUniform3fvARB(ph, 1, param4); break; case SP_RENDERTEXTURESCALE: if (r_config.texture_non_power_of_two) { param4[0] = 1; param4[1] = 1; } else { r = 1; g = 1; while (r < vid.pixelwidth) r *= 2; while (g < vid.pixelheight) g *= 2; param4[0] = vid.pixelwidth/(float)r; param4[1] = vid.pixelheight/(float)g; } param4[2] = 0; param4[3] = 0; qglUniform4fvARB(ph, 1, param4); break; case SP_LIGHTSCREEN: { float v[4], tempv[4]; v[0] = shaderstate.lightorg[0]; v[1] = shaderstate.lightorg[1]; v[2] = shaderstate.lightorg[2]; v[3] = 1; Matrix4x4_CM_Transform4(shaderstate.modelviewmatrix, v, tempv); Matrix4x4_CM_Transform4(r_refdef.m_projection, tempv, v); v[3] *= 2; v[0] = (v[0]/v[3]) + 0.5; v[1] = (v[1]/v[3]) + 0.5; v[2] = (v[2]/v[3]) + 0.5; qglUniform3fvARB(ph, 1, v); } break; case SP_LIGHTRADIUS: qglUniform1fARB(ph, shaderstate.lightradius); break; case SP_LIGHTCOLOUR: qglUniform3fvARB(ph, 1, shaderstate.lightcolours); break; case SP_W_FOG: qglUniform4fvARB(ph, 1, r_refdef.gfog_rgbd); break; case SP_V_EYEPOS: qglUniform3fvARB(ph, 1, r_origin); break; case SP_E_EYEPOS: { /*eye position in model space*/ vec3_t t2; Matrix4x4_CM_Transform3(shaderstate.modelmatrixinv, r_origin, t2); qglUniform3fvARB(ph, 1, t2); } break; case SP_LIGHTPOSITION: { /*light position in model space*/ vec3_t t2; Matrix4x4_CM_Transform3(shaderstate.modelmatrixinv, 
shaderstate.lightorg, t2); qglUniform3fvARB(ph, 1, t2); } break; case SP_LIGHTCOLOURSCALE: qglUniform3fvARB(ph, 1, shaderstate.lightcolourscale); break; case SP_LIGHTPROJMATRIX: { float t[16]; Matrix4x4_CM_Projection_Far(t, 90, 90, 4, 3000); qglUniformMatrix4fvARB(ph, 1, false, t); } break; case SP_LIGHTCUBEMATRIX: /*light's texture projection matrix*/ { float t[16]; Matrix4_Multiply(shaderstate.modelmatrix, shaderstate.lightprojmatrix, t); qglUniformMatrix4fvARB(ph, 1, false, t); } break; case SP_LIGHTSHADOWMAPINFO: qglUniform4fvARB(ph, 1, shaderstate.lightshadowmapinfo); break; /*static lighting info*/ case SP_E_L_DIR: qglUniform3fvARB(ph, 1, (float*)shaderstate.curentity->light_dir); break; case SP_E_L_MUL: qglUniform3fvARB(ph, 1, (float*)shaderstate.curentity->light_range); break; case SP_E_L_AMBIENT: qglUniform3fvARB(ph, 1, (float*)shaderstate.curentity->light_avg); break; case SP_E_TIME: qglUniform1fARB(ph, shaderstate.curtime); break; case SP_CONSTI: case SP_TEXTURE: qglUniform1iARB(ph, p->ival); break; case SP_CONSTF: qglUniform1fARB(ph, p->fval); break; case SP_CVARI: qglUniform1iARB(ph, ((cvar_t*)p->pval)->ival); break; case SP_CVARF: qglUniform1fARB(ph, ((cvar_t*)p->pval)->value); break; case SP_CVAR3F: { cvar_t *var = (cvar_t*)p->pval; char *vs = var->string; vs = COM_Parse(vs); param4[0] = atof(com_token); vs = COM_Parse(vs); param4[1] = atof(com_token); vs = COM_Parse(vs); param4[2] = atof(com_token); qglUniform3fvARB(ph, 1, param4); } break; default: Host_EndGame("Bad shader program parameter type (%i)", p->type); break; } } } static void BE_RenderMeshProgram(const shader_t *shader, const shaderpass_t *pass) { program_t *p = shader->prog; int i; int perm; perm = 0; if (shaderstate.sourcevbo->numbones) { if (p->permu[perm|PERMUTATION_SKELETAL].handle.glsl) perm |= PERMUTATION_SKELETAL; else return; } if (p->permu[perm|PERMUTATION_FRAMEBLEND].handle.glsl && shaderstate.sourcevbo->coord2.gl.addr) perm |= PERMUTATION_FRAMEBLEND; if 
(TEXVALID(shaderstate.curtexnums->bump) && p->permu[perm|PERMUTATION_BUMPMAP].handle.glsl) perm |= PERMUTATION_BUMPMAP; if (TEXVALID(shaderstate.curtexnums->fullbright) && p->permu[perm|PERMUTATION_FULLBRIGHT].handle.glsl) perm |= PERMUTATION_FULLBRIGHT; if ((TEXVALID(shaderstate.curtexnums->loweroverlay) || TEXVALID(shaderstate.curtexnums->upperoverlay)) && p->permu[perm|PERMUTATION_UPPERLOWER].handle.glsl) perm |= PERMUTATION_UPPERLOWER; if (r_refdef.gfog_rgbd[3] && p->permu[perm|PERMUTATION_FOG].handle.glsl) perm |= PERMUTATION_FOG; if (p->permu[perm|PERMUTATION_DELUXE].handle.glsl && TEXVALID(shaderstate.curtexnums->bump) && shaderstate.curbatch->lightmap[0] >= 0 && lightmap[shaderstate.curbatch->lightmap[0]]->hasdeluxe) perm |= PERMUTATION_DELUXE; if (shaderstate.curbatch->lightmap[1] >= 0 && p->permu[perm|PERMUTATION_LIGHTSTYLES].handle.glsl) perm |= PERMUTATION_LIGHTSTYLES; GL_SelectProgram(p->permu[perm].handle.glsl); #ifndef FORCESTATE if (shaderstate.lastuniform == p->permu[perm].handle.glsl) i = true; else #endif { i = false; shaderstate.lastuniform = p->permu[perm].handle.glsl; } BE_Program_Set_Attributes(p, perm, i); BE_SendPassBlendDepthMask(pass->shaderbits); BE_EnableShaderAttributes(p->permu[perm].attrmask, shaderstate.sourcevbo->vao); if (p->nofixedcompat) { for (i = 0; i < pass->numMergedPasses; i++) { Shader_BindTextureForPass(i, pass+i); } if (perm & PERMUTATION_LIGHTSTYLES) { GL_LazyBind(i++, GL_TEXTURE_2D, shaderstate.curbatch->lightmap[1] >= 0?lightmap[shaderstate.curbatch->lightmap[1]]->lightmap_texture:r_nulltex); GL_LazyBind(i++, GL_TEXTURE_2D, shaderstate.curbatch->lightmap[2] >= 0?lightmap[shaderstate.curbatch->lightmap[2]]->lightmap_texture:r_nulltex); GL_LazyBind(i++, GL_TEXTURE_2D, shaderstate.curbatch->lightmap[3] >= 0?lightmap[shaderstate.curbatch->lightmap[3]]->lightmap_texture:r_nulltex); //we need this loop to fix up fixed-function stuff for (; i < shaderstate.lastpasstmus; i++) { GL_LazyBind(i, 0, r_nulltex); } 
shaderstate.lastpasstmus = pass->numMergedPasses+3; } else { //we need this loop to fix up fixed-function stuff for (; i < shaderstate.lastpasstmus; i++) { GL_LazyBind(i, 0, r_nulltex); } shaderstate.lastpasstmus = pass->numMergedPasses; } } else { GenerateColourMods(pass); for (i = 0; i < pass->numMergedPasses; i++) { Shader_BindTextureForPass(i, pass+i); BE_GeneratePassTC(pass+i, i); } for (; i < shaderstate.lastpasstmus; i++) { GL_LazyBind(i, 0, r_nulltex); } shaderstate.lastpasstmus = pass->numMergedPasses; } BE_SubmitMeshChain(); } qboolean GLBE_LightCullModel(vec3_t org, model_t *model) { #ifdef RTLIGHTS if ((shaderstate.mode == BEM_LIGHT || shaderstate.mode == BEM_STENCIL || shaderstate.mode == BEM_DEPTHONLY)) { float dist; vec3_t disp; if (model->type == mod_alias) { VectorSubtract(org, shaderstate.lightorg, disp); dist = DotProduct(disp, disp); if (dist > model->radius*model->radius + shaderstate.lightradius*shaderstate.lightradius) return true; } else { int i; for (i = 0; i < 3; i++) { if (shaderstate.lightorg[i]-shaderstate.lightradius > org[i] + model->maxs[i]) return true; if (shaderstate.lightorg[i]+shaderstate.lightradius < org[i] + model->mins[i]) return true; } } } #endif return false; } //Note: Be cautious about using BEM_LIGHT here, as it won't select the light. void GLBE_SelectMode(backendmode_t mode) { extern int gldepthfunc; if (mode != shaderstate.mode) { shaderstate.mode = mode; shaderstate.flags = 0; switch (mode) { default: break; case BEM_DEPTHONLY: GL_DeSelectProgram(); /*BEM_DEPTHONLY does support mesh writing, but its not the only way its used... FIXME!*/ while(shaderstate.lastpasstmus>0) { GL_LazyBind(--shaderstate.lastpasstmus, 0, r_nulltex); } //we don't write or blend anything (maybe alpha test... 
but mneh) BE_SendPassBlendDepthMask(SBITS_MISC_DEPTHWRITE | SBITS_MASK_BITS); BE_SetPassBlendMode(0, PBM_REPLACE); GL_CullFace(SHADER_CULL_FRONT); break; #ifdef RTLIGHTS case BEM_STENCIL: /*BEM_STENCIL doesn't support mesh writing*/ GLBE_PushOffsetShadow(false); if (gl_config.nofixedfunc && !shaderstate.allblackshader) { char *defs[] = {NULL}; shaderstate.allblackshader = GLSlang_CreateProgram("allblackprogram", gl_config.gles?100:110, defs, "#include \"sys/skeletal.h\"\nvoid main(){gl_Position = skeletaltransform();}", "void main(){gl_FragColor=vec4(0.0,0.0,0.0,1.0);}", false); } //disable all tmus while(shaderstate.lastpasstmus>0) { GL_LazyBind(--shaderstate.lastpasstmus, 0, r_nulltex); } if (!gl_config.nofixedfunc) { GL_DeSelectProgram(); //replace mode please BE_SetPassBlendMode(0, PBM_REPLACE); } //we don't write or blend anything (maybe alpha test... but mneh) BE_SendPassBlendDepthMask(SBITS_MISC_DEPTHCLOSERONLY | SBITS_MASK_BITS); GL_CullFace(0); //don't change cull stuff, and //don't actually change stencil stuff - caller needs to be //aware of how many times stuff is drawn, so they can do that themselves. 
break; case BEM_CREPUSCULAR: if (!shaderstate.crepopaqueshader) { shaderstate.crepopaqueshader = R_RegisterShader("crepuscular_opaque", "{\n" "program crepuscular_opaque\n" "}\n" ); } if (!shaderstate.crepskyshader) { shaderstate.crepskyshader = R_RegisterShader("crepuscular_sky", "{\n" "program crepuscular_sky\n" "{\n" "map $diffuse\n" "}\n" "{\n" "map $fullbright\n" "}\n" "}\n" ); } break; #endif case BEM_FOG: while(shaderstate.lastpasstmus>0) { GL_LazyBind(--shaderstate.lastpasstmus, 0, r_nulltex); } GL_LazyBind(0, GL_TEXTURE_2D, shaderstate.fogtexture); shaderstate.lastpasstmus = 1; Vector4Set(shaderstate.pendingcolourflat, 1, 1, 1, 1); shaderstate.pendingcolourvbo = 0; shaderstate.pendingcolourpointer = NULL; BE_SetPassBlendMode(0, PBM_MODULATE); BE_SendPassBlendDepthMask(SBITS_SRCBLEND_SRC_ALPHA | SBITS_DSTBLEND_ONE_MINUS_SRC_ALPHA | SBITS_MISC_DEPTHEQUALONLY); break; } } } void GLBE_SelectEntity(entity_t *ent) { float nd; shaderstate.curentity = ent; currententity = ent; R_RotateForEntity(shaderstate.modelmatrix, shaderstate.modelviewmatrix, shaderstate.curentity, shaderstate.curentity->model); Matrix4_Invert(shaderstate.modelmatrix, shaderstate.modelmatrixinv); if (qglLoadMatrixf) qglLoadMatrixf(shaderstate.modelviewmatrix); if (shaderstate.curentity->flags & Q2RF_DEPTHHACK) nd = 0.3; else nd = 1; if (shaderstate.depthrange != nd) { shaderstate.depthrange = nd; if (qglDepthRange) qglDepthRange (gldepthmin, gldepthmin + shaderstate.depthrange*(gldepthmax-gldepthmin)); else if (qglDepthRangef) qglDepthRangef (gldepthmin, gldepthmin + shaderstate.depthrange*(gldepthmax-gldepthmin)); } shaderstate.lastuniform = 0; shaderstate.curtime = shaderstate.updatetime - shaderstate.curentity->shaderTime; } #if 0 static void BE_SelectFog(vec3_t colour, float alpha, float density) { float zscale; density /= 64; zscale = 2048; /*this value is meant to be the distance at which fog the value becomes as good as fully fogged, just hack it to 2048...*/ 
GenerateFogTexture(&shaderstate.fogtexture, density, zscale); shaderstate.fogfar = 1/zscale; /*scaler for z coords*/ qglColor4f(colour[0], colour[1], colour[2], alpha); } #endif #ifdef RTLIGHTS static qboolean GLBE_RegisterLightShader(int mode) { if (!shaderstate.inited_shader_light[mode]) { char *name = va("rtlight%s%s%s", (mode & (1u<prog) { shaderstate.shader_light[mode] = NULL; } } if (shaderstate.shader_light[mode]) return true; return false; } #endif void GLBE_SelectDLight(dlight_t *dl, vec3_t colour) { float view[16], proj[16]; int lmode; extern cvar_t gl_specular; extern cvar_t r_shadow_shadowmapping; /*generate light projection information*/ float nearplane = 4; if (dl->fov) { Matrix4x4_CM_Projection_Far(proj, dl->fov, dl->fov, nearplane, dl->radius); Matrix4x4_CM_ModelViewMatrixFromAxis(view, dl->axis[0], dl->axis[1], dl->axis[2], dl->origin); Matrix4_Multiply(proj, view, shaderstate.lightprojmatrix); } else { Matrix4x4_CM_Projection_Far(proj, 90, 90, nearplane, dl->radius); Matrix4x4_CM_ModelViewMatrixFromAxis(shaderstate.lightprojmatrix, dl->axis[0], dl->axis[1], dl->axis[2], dl->origin); } /*simple info*/ shaderstate.lightradius = dl->radius; VectorCopy(dl->origin, shaderstate.lightorg); VectorCopy(dl->lightcolourscales, shaderstate.lightcolourscale); shaderstate.lightcolourscale[2] *= gl_specular.value; VectorCopy(colour, shaderstate.lightcolours); #ifdef RTLIGHTS shaderstate.lightcubemap = dl->cubetexture; #endif shaderstate.lastuniform = 0; lmode = 0; #ifdef RTLIGHTS if (((dl->flags & LFLAG_SHADOWMAP) || r_shadow_shadowmapping.ival) && GLBE_RegisterLightShader(lmode | (1u<fov && GLBE_RegisterLightShader(lmode | (1u<