cemu_graphic_packs/Enhancements/NewSuperMarioBrosU_FancyFX/03285368cf940e37_0000000000000079_ps.txt

#version 420
#extension GL_ARB_texture_gather : enable
#extension GL_ARB_separate_shader_objects : enable
// Cross-API helper macros: the same shader text is compiled either with VULKAN defined
// or without it (OpenGL path). Each macro takes both the GL and the Vulkan placement
// arguments and expands to whichever the active API needs.
#ifdef VULKAN
// Vulkan path: layouts carry a descriptor set plus a location/binding; the GL location argument is dropped.
#define ATTR_LAYOUT(__vkSet, __location) layout(set = __vkSet, location = __location)
#define UNIFORM_BUFFER_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(set = __vkSet, binding = __vkLocation, std140)
#define TEXTURE_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(set = __vkSet, binding = __vkLocation)
// Writes gl_Position, then replaces z with (z + w) / 2.
// NOTE(review): presumably remaps GL-style clip depth to Vulkan's depth range - confirm.
#define SET_POSITION(_v) gl_Position = _v; gl_Position.z = (gl_Position.z + gl_Position.w) / 2.0
// gl_FragCoord with xy multiplied by uf_fragCoordScale.xy (uf_fragCoordScale is a vec4 on this path).
#define GET_FRAGCOORD() vec4(gl_FragCoord.xy*uf_fragCoordScale.xy,gl_FragCoord.zw)
// Alias the GL built-in index names to the Vulkan ones.
#define gl_VertexID gl_VertexIndex
#define gl_InstanceID gl_InstanceIndex
#else
// OpenGL path: only the GL location/binding is used; the Vulkan set and binding arguments are dropped.
#define ATTR_LAYOUT(__vkSet, __location) layout(location = __location)
#define UNIFORM_BUFFER_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(binding = __glLocation, std140) 
#define TEXTURE_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(binding = __glLocation)
// Position is stored unchanged.
#define SET_POSITION(_v) gl_Position = _v
// gl_FragCoord with xy multiplied by uf_fragCoordScale (a vec2 on this path).
#define GET_FRAGCOORD() vec4(gl_FragCoord.xy*uf_fragCoordScale,gl_FragCoord.zw)
#endif
// This shader was auto-converted from OpenGL to Cemu, so expect weird code and possible errors.

// shader 03285368cf940e37 //box bg

//float dither = $dither ;
//float scaleShader = $scaleShader;
// Multiplier applied to the one-texel step that main() hands to blur() as its tap spacing.
// `$scaleBlur` is a preset placeholder: it has to be replaced with a numeric value before
// this file is valid GLSL.
float scaleBlur = $scaleBlur; //0.25 4k
// Multiplier on the base tap count (samples = 8 * sampleScale).
const int sampleScale = 2;
//float lightBloom = 0.95; 


// Source texture; it is read through textureLod() inside blur() and sized with textureSize() in main().
TEXTURE_LAYOUT(0, 1, 0) uniform sampler2D textureUnitPS0;// Tex0 addr 0xf4240800 res 1280x720x1 dim 1 tm: 4 format 001a compSel: 0 1 2 3 mipView: 0x0 (num 0x1
// Interpolated input: main() uses .xy as the texture coordinate to blur around and
// passes .w through as the output alpha.
layout(location = 0) in vec4 passParameterSem3;
// Fragment colour written by main().
layout(location = 0) out vec4 passPixelColor0;
// Scale factor consumed by the GET_FRAGCOORD() macro: a vec4 member of a uniform block
// when VULKAN is defined, a plain vec2 uniform otherwise.
#ifdef VULKAN
layout(set = 1, binding = 1) uniform ufBlock
{
uniform vec4 uf_fragCoordScale;
};
#else
uniform vec2 uf_fragCoordScale;
#endif

// FabriceNeyret2 CC, single shader gaussian by intermediate MIPmap level. www.shadertoy.com/view/ltScRG

// Kernel extent in tap-offset units (author's note: a base of 8 or 4 balances the xy position).
const int samples = 8 * sampleScale;
// Mip level every tap is read from.
const int LOD = 2;
// Spacing between neighbouring taps: 2^LOD.
const int sLOD = 1 << LOD;
// Gaussian standard deviation, a quarter of the kernel extent.
const float sigma = float(samples) * .25;

// Weight of an isotropic 2D Gaussian with standard deviation `sigma` at offset `i`.
//   i - tap offset from the kernel origin, in the same units as `sigma`
// Returns exp(-0.5 * |i / sigma|^2) / (6.28 * sigma^2); 6.28 is the literal used for 2*pi.
float gaussian(vec2 i) {
	// Normalise the offset up front instead of mutating the parameter inside the dot()
	// argument list, so the value does not hinge on argument evaluation order.
	vec2 scaled = i / sigma;
	float falloff = exp(-.5 * dot(scaled, scaled));
	return falloff / (6.28 * sigma * sigma);
}

// Gaussian-weighted blur of `sp` around texture coordinate `U`.
// Taps sit on a side-by-side grid (side = samples / sLOD), spaced sLOD apart and shifted
// by -samples/2; every tap reads mip level LOD and is weighted by gaussian(offset).
//   sp    - texture to sample
//   U     - texture coordinate of the pixel being blurred
//   scale - factor applied to each grid offset before it is added to U
// Returns the weighted RGB sum times a fixed gain of 18, with alpha set to 0.0.
vec4 blur(sampler2D sp, vec2 U, vec2 scale) {
	int side = samples / sLOD;
	float halfSpan = float(samples) / 2.;
	vec4 sum = vec4(0.0);

	// Rows outermost, columns innermost: the same visiting order as a flat index k
	// decomposed into (k % side, k / side).
	for (int row = 0; row < side; row++) {
		for (int col = 0; col < side; col++) {
			vec2 offset = vec2(col, row) * float(sLOD) - halfSpan;
			sum += gaussian(offset) * textureLod(sp, U + scale * offset, float(LOD));
		}
	}

	// The weights are not renormalised here; the constant gain is applied instead.
	// Author's tuning note: 16 exact, 17 ~ a touch more haze to compensate res increase.
	return vec4(sum.xyz, 0.0) * 18.0;
}

// Clamps the float whose bit pattern is held in `v` to [0.0, 1.0] and hands the result
// back as a bit pattern. Two patterns are answered before the clamp is attempted:
// 0x7FFFFFFF gives the bits of 1.0 and 0xFFFFFFFF gives the bits of 0.0
// (both are NaN encodings, so they cannot be ordered by clamp()).
int clampFI32(int v)
{
	if (v == 0xFFFFFFFF) {
		return floatBitsToInt(0.0);
	}
	if (v == 0x7FFFFFFF) {
		return floatBitsToInt(1.0);
	}
	float asFloat = intBitsToFloat(v);
	return floatBitsToInt(clamp(asFloat, 0.0, 1.0));
}
// Product of a and b, except that the result is 0.0 whenever either operand compares
// equal to zero (so 0 * inf and 0 * NaN give 0.0 rather than NaN).
float mul_nonIEEE(float a, float b)
{
	bool bothNonZero = (a != 0.0) && (b != 0.0);
	return bothNonZero ? a * b : 0.0;
}
// Fragment entry point: writes a blurred copy of textureUnitPS0 to passPixelColor0.
// RGB comes from blur() centred on passParameterSem3.xy; alpha is passParameterSem3.w
// passed through unchanged.
void main()
{
	// Size of one mip-0 texel in normalised texture coordinates.
	vec2 texel = vec2(1.0) / textureSize(textureUnitPS0, 0);

	// A single blurred sample stands in for all four taps of the combine below
	// (the stock shader read them at .xy, .zy, .xw and .zw of the input).
	vec3 tap = blur(textureUnitPS0, passParameterSem3.xy, texel * scaleBlur).xyz;

	// Four-tap combine, kept step for step so rounding matches the scalar register form:
	//   average of taps 1 and 2, plus half of tap 3, plus half of tap 4, then halved.
	vec3 pairAvg = (tap + tap) / 2.0;
	vec3 threeTap = tap * 0.5 + pairAvg;
	vec3 color = (tap * 0.5 + threeTap) / 2.0;

	// export
	passPixelColor0 = vec4(color, passParameterSem3.w);
}
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00			`#version 420`
			`#extension GL_ARB_texture_gather : enable`
			`#extension GL_ARB_separate_shader_objects : enable`
Update every graphic pack to V4 Since it's not possible to update 300+ shaders manually and automation was possible, I thought that I'd take the honor and create a script that's able to automatically convert all of the shaders to be cross-compatible with Vulkan. And change the graphic pack versions to version 4 of course. Also, the script has some nifty testing code which compiled every shader as OpenGL and Vulkan, but for that see the details that I've written below. Here's the script that I've made to do all of this. No manual edits were needed: https://gist.github.com/Crementif/8d98a855b95f219d95298fb3db99deae 2019-11-29 04:36:05 +01:00			`#ifdef VULKAN`
			`#define ATTR_LAYOUT(__vkSet, __location) layout(set = __vkSet, location = __location)`
			`#define UNIFORM_BUFFER_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(set = __vkSet, binding = __vkLocation, std140)`
			`#define TEXTURE_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(set = __vkSet, binding = __vkLocation)`
			`#define SET_POSITION(_v) gl_Position = _v; gl_Position.z = (gl_Position.z + gl_Position.w) / 2.0`
			`#define GET_FRAGCOORD() vec4(gl_FragCoord.xy*uf_fragCoordScale.xy,gl_FragCoord.zw)`
			`#define gl_VertexID gl_VertexIndex`
			`#define gl_InstanceID gl_InstanceIndex`
			`#else`
			`#define ATTR_LAYOUT(__vkSet, __location) layout(location = __location)`
			`#define UNIFORM_BUFFER_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(binding = __glLocation, std140)`
			`#define TEXTURE_LAYOUT(__glLocation, __vkSet, __vkLocation) layout(binding = __glLocation)`
			`#define SET_POSITION(_v) gl_Position = _v`
			`#define GET_FRAGCOORD() vec4(gl_FragCoord.xy*uf_fragCoordScale,gl_FragCoord.zw)`
			`#endif`
			`// This shaders was auto-converted from OpenGL to Cemu so expect weird code and possible errors.`

New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00			`// shader 03285368cf940e37 //box bg`

Update 03285368cf940e37_0000000000000079_ps.txt fixes a compile error of this shader in cemu Portuguese language localization 2018-12-14 20:49:18 -07:00			`//float dither = $dither ;`
			`//float scaleShader = $scaleShader;`
Fix shader errors and shader cleanup Since I wanted to make sure that I didn't broke the shaders after converting the shaders to Vulkan, we need to check if all the shaders weren't broken. Since we're talking about like 400 shaders checking all of them is pretty much impossible and even then, So, the obvious solution was to automate the checking. Not as simple as you'd think, because in 300 of our shaders we use preset variables which without replacing the value like Cemu does, will make the shader error regardless. So I also implemented some functionality that would read the preset values and types out of the rules.txt file and replace them in the shaders using that information. And then we use Khronos' glslang to compile the shaders, using both OpenGL and Vulkan. The result was that glslang found quite a few errors in some of the shaders, which I fixed in this commit. I'm considering adding this rules.txt parsing and automated shader compilation testing to the build process. Also, I fixed Clarity's name and description since Monochromia isn't available anymore and Xenoblade's resolution pack had a lot of weird blank lines before their #version declaration, which my converter didn't like. 2019-11-29 00:51:00 +01:00			`float scaleBlur = $scaleBlur; //0.25 4k`
			`const int sampleScale = 2;`
Update 03285368cf940e37_0000000000000079_ps.txt fixes a compile error of this shader in cemu Portuguese language localization 2018-12-14 20:49:18 -07:00			`//float lightBloom = 0.95;`
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00

Update every graphic pack to V4 Since it's not possible to update 300+ shaders manually and automation was possible, I thought that I'd take the honor and create a script that's able to automatically convert all of the shaders to be cross-compatible with Vulkan. And change the graphic pack versions to version 4 of course. Also, the script has some nifty testing code which compiled every shader as OpenGL and Vulkan, but for that see the details that I've written below. Here's the script that I've made to do all of this. No manual edits were needed: https://gist.github.com/Crementif/8d98a855b95f219d95298fb3db99deae 2019-11-29 04:36:05 +01:00			`TEXTURE_LAYOUT(0, 1, 0) uniform sampler2D textureUnitPS0;// Tex0 addr 0xf4240800 res 1280x720x1 dim 1 tm: 4 format 001a compSel: 0 1 2 3 mipView: 0x0 (num 0x1`
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00			`layout(location = 0) in vec4 passParameterSem3;`
			`layout(location = 0) out vec4 passPixelColor0;`
Update every graphic pack to V4 Since it's not possible to update 300+ shaders manually and automation was possible, I thought that I'd take the honor and create a script that's able to automatically convert all of the shaders to be cross-compatible with Vulkan. And change the graphic pack versions to version 4 of course. Also, the script has some nifty testing code which compiled every shader as OpenGL and Vulkan, but for that see the details that I've written below. Here's the script that I've made to do all of this. No manual edits were needed: https://gist.github.com/Crementif/8d98a855b95f219d95298fb3db99deae 2019-11-29 04:36:05 +01:00			`#ifdef VULKAN`
			`layout(set = 1, binding = 1) uniform ufBlock`
			`{`
			`uniform vec4 uf_fragCoordScale;`
			`};`
			`#else`
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00			`uniform vec2 uf_fragCoordScale;`
Update every graphic pack to V4 Since it's not possible to update 300+ shaders manually and automation was possible, I thought that I'd take the honor and create a script that's able to automatically convert all of the shaders to be cross-compatible with Vulkan. And change the graphic pack versions to version 4 of course. Also, the script has some nifty testing code which compiled every shader as OpenGL and Vulkan, but for that see the details that I've written below. Here's the script that I've made to do all of this. No manual edits were needed: https://gist.github.com/Crementif/8d98a855b95f219d95298fb3db99deae 2019-11-29 04:36:05 +01:00			`#endif`
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00
			`// FabriceNeyret2 CC, single shader gaussian by intermediate MIPmap level. www.shadertoy.com/view/ltScRG`
			`const int samples = 8 * sampleScale, //8 or 4 balances xy position`
			`LOD = 2, // gaussian done on MIPmap at scale LOD`
			`sLOD = 1 << LOD; // tile size = 2^LOD`
			`const float sigma = float(samples) * .25;`

			`float gaussian(vec2 i) {`
			`return exp(-.5* dot(i /= sigma, i)) / (6.28 * sigma*sigma);`
			`}`

			`vec4 blur(sampler2D sp, vec2 U, vec2 scale) {`
			`vec4 O = vec4(0.0);`
			`int s = samples / sLOD;`

			`for (int i = 0; i < s*s; i++) {`
			`vec2 d = vec2(i%s, i / s)*float(sLOD) - float(samples) / 2.;`
			`O += gaussian(d) * textureLod(sp, U + scale * d, float(LOD));`
			`}`

			`//O / O.a;`
[NSMBU] Default to basic build / move custom shaders to Enhancements 2019-01-10 00:34:19 +01:00			`return vec4(O.x, O.y, O.z, 0.0)*18; //16 exact, 17 ~ a touch more haze to compensate res increase`
New super mario bros 1..4.x - Rules n shaders 2018-10-31 18:48:11 +01:00			`}`

			`int clampFI32(int v)`
			`{`
			`if( v == 0x7FFFFFFF )`
			`return floatBitsToInt(1.0);`
			`else if( v == 0xFFFFFFFF )`
			`return floatBitsToInt(0.0);`
			`return floatBitsToInt(clamp(intBitsToFloat(v), 0.0, 1.0));`
			`}`
			`float mul_nonIEEE(float a, float b){return mix(0.0, a*b, (a != 0.0) && (b != 0.0));}`
			`void main()`
			`{`
			`vec4 R0f = vec4(0.0);`
			`vec4 R1f = vec4(0.0);`
			`vec4 R2f = vec4(0.0);`
			`vec4 R3f = vec4(0.0);`
			`vec4 R123f = vec4(0.0);`
			`float backupReg0f, backupReg1f, backupReg2f, backupReg3f, backupReg4f;`
			`vec4 PV0f = vec4(0.0), PV1f = vec4(0.0);`
			`float PS0f = 0.0, PS1f = 0.0;`
			`vec4 tempf = vec4(0.0);`
			`float tempResultf;`
			`int tempResulti;`
			`ivec4 ARi = ivec4(0);`
			`bool predResult = true;`
			`vec3 cubeMapSTM;`
			`int cubeMapFaceId;`
			`R0f = passParameterSem3;`

			`vec2 coord = passParameterSem3.xy*textureSize(textureUnitPS0, 0); //`
			`vec2 ps = vec2(1.0) / textureSize(textureUnitPS0, 0);`
			`vec2 uv = coord * ps;`

			`R1f.xyz = blur(textureUnitPS0, R0f.xy, ps*scaleBlur).xyz;`
			`R2f.xyz = R1f.xyz;`
			`R3f.xyz = R1f.xyz;`
			`R0f.xyz = R1f.xyz;`
			`/*`
			`R1f.xyz = (texture(textureUnitPS0, R0f.xy).xyz);`
			`R2f.xyz = (texture(textureUnitPS0, R0f.zy).xyz);`
			`R3f.xyz = (texture(textureUnitPS0, R0f.xw).xyz);`
			`R0f.xyz = (texture(textureUnitPS0, R0f.zw).xyz);`
			`*/`

			`// 0`
			`PV0f.x = R1f.z + R2f.z;`
			`PV0f.x /= 2.0;`
			`PV0f.z = R1f.y + R2f.y;`
			`PV0f.z /= 2.0;`
			`PV0f.w = R1f.x + R2f.x;`
			`PV0f.w /= 2.0;`
			`// 1`
			`R123f.x = (R3f.y * 0.5 + PV0f.z);`
			`PV1f.x = R123f.x;`
			`R123f.y = (R3f.x * 0.5 + PV0f.w);`
			`PV1f.y = R123f.y;`
			`R123f.w = (R3f.z * 0.5 + PV0f.x);`
			`PV1f.w = R123f.w;`
			`// 2`
			`backupReg0f = R0f.x;`
			`backupReg1f = R0f.y;`
			`backupReg2f = R0f.z;`
			`R0f.x = (backupReg0f * 0.5 + PV1f.y)/2.0;`
			`R0f.y = (backupReg1f * 0.5 + PV1f.x)/2.0;`
			`R0f.z = (backupReg2f * 0.5 + PV1f.w)/2.0;`
			`// export`
			`passPixelColor0 = vec4(R0f.x, R0f.y, R0f.z, R0f.w);`
			`}`