226 lines
7.0 KiB
226 lines
7.0 KiB
|
|
vs.1.1 |
|
|
|
dcl_position v0 |
|
dcl_color v5 |
|
dcl_texcoord0 v7 |
|
|
|
// Store our input position in world space in r6 |
|
m4x3 r6, v0, c25; // v0 * l2w |
|
// Fill out our w (m4x3 doesn't touch w). |
|
mov r6.w, c16.z; |
|
|
|
// |
|
|
|
// Input diffuse v5 color is: |
|
// v5.r = overall transparency |
|
// v5.g = reflection strength (transparency) |
|
// v5.b = overall wave scaling |
|
// |
|
// v5.a is: |
|
// v5.w = 1/(2.f * edge length) |
|
// So per wave filtering is: |
|
// min(max( (waveLen * v5.wwww) - 1), 0), 1.f); |
|
// So a wave effect starts dying out when the wave is 4 times the sampling frequency, |
|
// and is completely filtered at 2 times sampling frequency. |
|
|
|
// We'd like to make this autocalculated based on the depth of the water. |
|
// The frequency filtering (v5.w) still needs to be calculated offline, because |
|
// it's dependent on edge length, but the first 3 filterings can be calculated |
|
// based on this vertex. |
|
// Basically, we want the transparency, reflection strength, and wave scaling |
|
// to go to zero as the water depth goes to zero. Linear falloffs are as good |
|
// a place to start as any. |
|
// |
|
// depth = waterlevel - r6.z => depth in feet (may be negative) |
|
// depthNorm = depth / depthFalloff => zero at watertable, one at depthFalloff beneath |
|
// atten = minAtten + depthNorm * (maxAtten - minAtten); |
|
// These are all vector ops. |
|
// This provides separate ramp ups for each of the channels (they reach full unfiltered |
|
// values at different depths), but doesn't provide separate controls for where they |
|
// go to zero (they all go to zero at zero depth). For that we need an offset. An offset |
|
// in feet (depth) is probably the most intuitive. So that changes the first calculation |
|
// of depth to: |
|
// depth = waterlevel - r6.z + offset |
|
// = (waterlevel + offset) - r6.z |
|
// And since we only need offsets for 3 channels, we can make the waterlevel constant |
|
// waterlevel[chan] = watertableheight + offset[chan], |
|
// with waterlevel.w = watertableheight. |
|
// |
|
// So: |
|
// c30 = waterlevel + offset |
|
// c31 = (maxAtten - minAtten) / depthFalloff |
|
// c32 = minAtten. |
|
// And in particular: |
|
// c30.w = waterlevel |
|
// c31.w = 1.f; |
|
// c32.w = 0; |
|
// So r4.w is the depth of this vertex in feet. |
|
|
|
// Dot our position with our direction vectors. |
|
mul r0, c8, r6.xxxx; |
|
mad r0, c9, r6.yyyy, r0; |
|
|
|
// |
|
// dist = mad( dist, kFreq.xyzw, kPhase.xyzw); |
|
mul r0, r0, c5; |
|
add r0, r0, c6; |
|
// |
|
// // Now we need dist mod'd into range [-Pi..Pi] |
|
// dist *= rcp(kTwoPi); |
|
rcp r4, c15.wwww; |
|
add r0, r0, c15.zzzz; |
|
mul r0, r0, r4; |
|
// dist = frac(dist); |
|
expp r1.y, r0.xxxx |
|
mov r1.x, r1.yyyy |
|
expp r1.y, r0.zzzz |
|
mov r1.z, r1.yyyy |
|
expp r1.y, r0.wwww |
|
mov r1.w, r1.yyyy |
|
expp r1.y, r0.yyyy |
|
// dist *= kTwoPi; |
|
mul r0, r1, c15.wwww; |
|
// dist += -kPi; |
|
sub r0, r0, c15.zzzz; |
|
|
|
// |
|
// sincos(dist, sinDist, cosDist); |
|
// sin = r0 + r0^3 * vSin.y + r0^5 * vSin.z |
|
// cos = 1 + r0^2 * vCos.y + r0^4 * vCos.z |
|
mul r1, r0, r0; // r0^2 |
|
mul r2, r1, r0; // r0^3 - probably stall |
|
mul r3, r1, r1; // r0^4 |
|
mul r4, r1, r2; // r0^5 |
|
mul r5, r2, r3; // r0^7 |
|
|
|
mul r1, r1, c14.yyyy; // r1 = r0^2 * vCos.y |
|
mad r2, r2, c13.yyyy, r0; // r2 = r0 + r0^3 * vSin.y |
|
add r1, r1, c14.xxxx; // r1 = 1 + r0^2 * vCos.y |
|
mad r2, r4, c13.zzzz, r2; // r2 = r0 + r0^3 * vSin.y + r0^5 * vSin.z |
|
mad r1, r3, c14.zzzz, r1; // r1 = 1 + r0^2 * vCos.y + r0^4 * vCos.z |
|
|
|
// r0^7 & r0^6 terms |
|
mul r4, r4, r0; // r0^6 |
|
mad r2, r5, c13.wwww, r2; |
|
mad r1, r4, c14.wwww, r1; |
|
|
|
// Calc our depth based filtering here into r4 (because we don't use it again |
|
// after here, and we need our filtering shortly). |
|
sub r4, c30, r6.zzzz; |
|
mul r4, r4, c31; |
|
add r4, r4, c32; |
|
// Clamp .xyz to range [0..1] |
|
min r4.xyz, r4, c16.zzzz; |
|
max r4.xyz, r4, c16.xxxx; |
|
//mov r4.xyz, c16.xxx; // HACKTEST |
|
|
|
// Calc our filter (see above). |
|
mul r11, v5.wwww, c29; |
|
max r11, r11, c16.xxxx; |
|
min r11, r11, c16.zzzz; |
|
|
|
//mov r2, r1; |
|
// r2 == sinDist |
|
// r1 == cosDist |
|
// sinDist *= filter; |
|
mul r2, r2, r11; |
|
// sinDist *= kAmplitude.xyzw |
|
mul r2, r2, c7; |
|
// height = dp4(sinDist, kOne); |
|
// accumPos.z += height; (but accumPos.z is currently 0). |
|
dp4 r8.x, r2, c16.zzzz; |
|
mul r8.y, r8.x, r4.z; |
|
add r8.z, r8.y, c30.w; |
|
max r6.z, r6.z, r8.z; |
|
// r8.x == wave height relative to 0 |
|
// r8.y == dampened wave relative to 0 |
|
// r8.z == dampened wave height in world space |
|
// r6.z == wave height clamped to never go beneath ground level |
|
// |
|
// cosDist *= filter; |
|
mul r1, r1, r11; |
|
|
|
// Pos = (in.x + S, in.y + R, r6.z) |
|
// S = sum(k Dir.x A cos()) |
|
// R = sum(k Dir.y A cos()) |
|
// c10 = k Dir.x A |
|
// c11 = k Dir.y A |
|
// S = sum(cosDist * c10); |
|
dp4 r7.x, r1, c10; |
|
// R = sum(cosDist * c11); |
|
dp4 r7.y, r1, c11; |
|
|
|
add r6.xy, r6.xy, r7.xy; |
|
|
|
|
|
// Bias our vert up a bit to compensate for precision errors. |
|
// In particular, our filter coefficients are coming in as |
|
// interpolated bytes, so there's bound to be a lot of slop |
|
// from that. We've got a free slot in c35.z, so we'll use that. |
|
// A better implementation would be to bias and scale our screen |
|
// vert, effectively pushing the vert toward the camera without |
|
// actually moving it, but this is easier and might work just |
|
// as well. |
|
add r6.z, r6.z, c35.z; |
|
|
|
// |
|
// // Transform position to screen |
|
// |
|
// |
|
//m4x3 r6, v0, c25; // HACKAGE |
|
//mov r6.w, c16.z; // HACKAGE |
|
//m4x4 oPos, r6, c0; // ADDFOG |
|
m4x4 r9, r6, c0; |
|
add r10.x, r9.w, c4.x; |
|
mul oFog, r10.x, c4.y; |
|
mov oPos, r9; |
|
|
|
|
|
// Dyna Stuff |
|
// Constants |
|
// c33 = fC1U, fC2U, fC1V, fC2V |
|
// c34 = fInitAtten, t, life, 1.f / (life-decay) |
|
// c35 = ramp, 1.f / ramp, BIAS (positive is up), FREE |
|
// |
|
// Vertex Info |
|
// v7.z = fBirth (because we don't use it for anything else). |
|
// |
|
// Initialize r1.zw to 0,1 |
|
mov r1, c16.xxxz; |
|
// Calc r1.x = age, r1.y = atten |
|
// age = t - birth. |
|
sub r1.x, c34.y, v7.z; |
|
// atten = clamp0_1(age / ramp) * clamp0_1((life-age) / (life-decay)); |
|
// first clamp0_1(age/ramp) |
|
mul r1.y, r1.x, c35.y; |
|
min r1.y, r1.y, c16.z; // Clamp to one (can't go negative). |
|
// now clamp0_1((life-age) / (life-decay)); |
|
sub r1.z, c34.z, r1.x; |
|
mul r1.z, r1.z, c34.w; |
|
min r1.z, r1.z, c16.z; // Clamp to one |
|
max r1.z, r1.z, c16.x; // Clamp to zero |
|
mul r1.y, r1.y, r1.z; // atten is the product of the two terms. |
|
|
|
// color is (atten, atten, atten, 1.f) |
|
// Need to calculate opacity we would have had from vs_WaveFixedFin7.inl |
|
// Right now that's just modulating by r4.y. |
|
mul r0.y, r4.y, c34.x; |
|
mul oD0, r0.yyyy, r1.yyyw; |
|
//mov oD0, c16.zzzz; // HACKTEST |
|
|
|
// UVW = (inUVW - 0.5) * scale + 0.5 |
|
// where: |
|
// scale = (fC1U / (age * fC2U + 1.f)), fC1V / (age * fC2U + 1.f), 1.f, 1.f |
|
mov r2, c16.xxxz; |
|
mul r2.xy, r1.xx, c33.yw; |
|
add r2.xy, r2.xy, c16.zz; |
|
rcp r2.x, r2.x; |
|
rcp r2.y, r2.y; |
|
mul r2.xy, r2.xy, c33.xz; |
|
sub r1.xy, v7.xy, c16.yy; |
|
mul r1.xy, r1.xy, r2.xy; |
|
add r1.xy, r1.xy, c16.yy; |
|
mov oT0, r1; |
|
|
|
|
|
|