lanczos_scale.effect 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292
/*
 * Lanczos sharper
 * Note: this shader is adapted from the GPL-licensed bsnes shader, which
 * contains very good work.
 */
  6. #include "color.effect"
  7. uniform float4x4 ViewProj;
  8. uniform texture2d image;
  9. uniform float2 base_dimension;
  10. uniform float2 base_dimension_i;
  11. uniform float undistort_factor = 1.0;
  12. uniform float multiplier;
  13. sampler_state textureSampler
  14. {
  15. AddressU = Clamp;
  16. AddressV = Clamp;
  17. Filter = Linear;
  18. };
  19. struct VertData {
  20. float4 pos : POSITION;
  21. float2 uv : TEXCOORD0;
  22. };
  23. struct VertOut {
  24. float2 uv : TEXCOORD0;
  25. float4 pos : POSITION;
  26. };
  27. struct FragData {
  28. float2 uv : TEXCOORD0;
  29. };
  30. VertOut VSDefault(VertData v_in)
  31. {
  32. VertOut vert_out;
  33. vert_out.uv = v_in.uv * base_dimension;
  34. vert_out.pos = mul(float4(v_in.pos.xyz, 1.0), ViewProj);
  35. return vert_out;
  36. }
  37. float weight(float x)
  38. {
  39. float x_pi = x * 3.141592654;
  40. return 3.0 * sin(x_pi) * sin(x_pi * (1.0 / 3.0)) / (x_pi * x_pi);
  41. }
  42. void weight6(float f_neg, out float3 tap012, out float3 tap345)
  43. {
  44. tap012 = float3(
  45. weight(f_neg - 2.0),
  46. weight(f_neg - 1.0),
  47. min(1.0, weight(f_neg))); // Replace NaN with 1.0.
  48. tap345 = float3(
  49. weight(f_neg + 1.0),
  50. weight(f_neg + 2.0),
  51. weight(f_neg + 3.0));
  52. // Normalize weights
  53. float sum = tap012.x + tap012.y + tap012.z + tap345.x + tap345.y + tap345.z;
  54. float sum_i = 1.0 / sum;
  55. tap012 = tap012 * sum_i;
  56. tap345 = tap345 * sum_i;
  57. }
  58. float AspectUndistortX(float x, float a)
  59. {
  60. // The higher the power, the longer the linear part will be.
  61. return (1.0 - a) * (x * x * x * x * x) + a * x;
  62. }
  63. float AspectUndistortU(float u)
  64. {
  65. // Normalize texture coord to -1.0 to 1.0 range, and back.
  66. return AspectUndistortX((u - 0.5) * 2.0, undistort_factor) * 0.5 + 0.5;
  67. }
  68. float2 undistort_coord(float xpos, float ypos)
  69. {
  70. return float2(AspectUndistortU(xpos), ypos);
  71. }
  72. float4 undistort_pixel(float xpos, float ypos)
  73. {
  74. return image.Sample(textureSampler, undistort_coord(xpos, ypos));
  75. }
  76. float4 undistort_line(float3 xpos012, float3 xpos345, float ypos, float3 rowtap012,
  77. float3 rowtap345)
  78. {
  79. return
  80. undistort_pixel(xpos012.x, ypos) * rowtap012.x +
  81. undistort_pixel(xpos012.y, ypos) * rowtap012.y +
  82. undistort_pixel(xpos012.z, ypos) * rowtap012.z +
  83. undistort_pixel(xpos345.x, ypos) * rowtap345.x +
  84. undistort_pixel(xpos345.y, ypos) * rowtap345.y +
  85. undistort_pixel(xpos345.z, ypos) * rowtap345.z;
  86. }
  87. float4 DrawLanczos(FragData f_in, bool undistort)
  88. {
  89. float2 pos = f_in.uv;
  90. float2 pos2 = floor(pos - 0.5) + 0.5;
  91. float2 f_neg = pos2 - pos;
  92. float3 rowtap012, rowtap345;
  93. weight6(f_neg.x, rowtap012, rowtap345);
  94. float3 coltap012, coltap345;
  95. weight6(f_neg.y, coltap012, coltap345);
  96. float2 uv2 = pos2 * base_dimension_i;
  97. float2 uv1 = uv2 - base_dimension_i;
  98. float2 uv0 = uv1 - base_dimension_i;
  99. float2 uv3 = uv2 + base_dimension_i;
  100. float2 uv4 = uv3 + base_dimension_i;
  101. float2 uv5 = uv4 + base_dimension_i;
  102. if (undistort) {
  103. float3 xpos012 = float3(uv0.x, uv1.x, uv2.x);
  104. float3 xpos345 = float3(uv3.x, uv4.x, uv5.x);
  105. return undistort_line(xpos012, xpos345, uv0.y, rowtap012, rowtap345) * coltap012.x +
  106. undistort_line(xpos012, xpos345, uv1.y, rowtap012, rowtap345) * coltap012.y +
  107. undistort_line(xpos012, xpos345, uv2.y, rowtap012, rowtap345) * coltap012.z +
  108. undistort_line(xpos012, xpos345, uv3.y, rowtap012, rowtap345) * coltap345.x +
  109. undistort_line(xpos012, xpos345, uv4.y, rowtap012, rowtap345) * coltap345.y +
  110. undistort_line(xpos012, xpos345, uv5.y, rowtap012, rowtap345) * coltap345.z;
  111. }
  112. float u_weight_sum = rowtap012.z + rowtap345.x;
  113. float u_middle_offset = rowtap345.x * base_dimension_i.x / u_weight_sum;
  114. float u_middle = uv2.x + u_middle_offset;
  115. float v_weight_sum = coltap012.z + coltap345.x;
  116. float v_middle_offset = coltap345.x * base_dimension_i.y / v_weight_sum;
  117. float v_middle = uv2.y + v_middle_offset;
  118. float2 coord_limit = base_dimension - 0.5;
  119. float2 coord0_f = max(uv0 * base_dimension, 0.5);
  120. float2 coord1_f = max(uv1 * base_dimension, 0.5);
  121. float2 coord4_f = min(uv4 * base_dimension, coord_limit);
  122. float2 coord5_f = min(uv5 * base_dimension, coord_limit);
  123. int2 coord0 = int2(coord0_f);
  124. int2 coord1 = int2(coord1_f);
  125. int2 coord4 = int2(coord4_f);
  126. int2 coord5 = int2(coord5_f);
  127. float4 row0 = image.Load(int3(coord0, 0)) * rowtap012.x;
  128. row0 += image.Load(int3(coord1.x, coord0.y, 0)) * rowtap012.y;
  129. row0 += image.Sample(textureSampler, float2(u_middle, uv0.y)) * u_weight_sum;
  130. row0 += image.Load(int3(coord4.x, coord0.y, 0)) * rowtap345.y;
  131. row0 += image.Load(int3(coord5.x, coord0.y, 0)) * rowtap345.z;
  132. float4 total = row0 * coltap012.x;
  133. float4 row1 = image.Load(int3(coord0.x, coord1.y, 0)) * rowtap012.x;
  134. row1 += image.Load(int3(coord1.x, coord1.y, 0)) * rowtap012.y;
  135. row1 += image.Sample(textureSampler, float2(u_middle, uv1.y)) * u_weight_sum;
  136. row1 += image.Load(int3(coord4.x, coord1.y, 0)) * rowtap345.y;
  137. row1 += image.Load(int3(coord5.x, coord1.y, 0)) * rowtap345.z;
  138. total += row1 * coltap012.y;
  139. float4 row23 = image.Sample(textureSampler, float2(uv0.x, v_middle)) * rowtap012.x;
  140. row23 += image.Sample(textureSampler, float2(uv1.x, v_middle)) * rowtap012.y;
  141. row23 += image.Sample(textureSampler, float2(u_middle, v_middle)) * u_weight_sum;
  142. row23 += image.Sample(textureSampler, float2(uv4.x, v_middle)) * rowtap345.y;
  143. row23 += image.Sample(textureSampler, float2(uv5.x, v_middle)) * rowtap345.z;
  144. total += row23 * v_weight_sum;
  145. float4 row4 = image.Load(int3(coord0.x, coord4.y, 0)) * rowtap012.x;
  146. row4 += image.Load(int3(coord1.x, coord4.y, 0)) * rowtap012.y;
  147. row4 += image.Sample(textureSampler, float2(u_middle, uv4.y)) * u_weight_sum;
  148. row4 += image.Load(int3(coord4.x, coord4.y, 0)) * rowtap345.y;
  149. row4 += image.Load(int3(coord5.x, coord4.y, 0)) * rowtap345.z;
  150. total += row4 * coltap345.y;
  151. float4 row5 = image.Load(int3(coord0.x, coord5.y, 0)) * rowtap012.x;
  152. row5 += image.Load(int3(coord1.x, coord5.y, 0)) * rowtap012.y;
  153. row5 += image.Sample(textureSampler, float2(u_middle, uv5.y)) * u_weight_sum;
  154. row5 += image.Load(int3(coord4.x, coord5.y, 0)) * rowtap345.y;
  155. row5 += image.Load(int3(coord5, 0)) * rowtap345.z;
  156. total += row5 * coltap345.z;
  157. return total;
  158. }
  159. float4 PSDrawLanczosRGBA(FragData f_in, bool undistort) : TARGET
  160. {
  161. return DrawLanczos(f_in, undistort);
  162. }
  163. float4 PSDrawLanczosRGBAMultiply(FragData f_in, bool undistort) : TARGET
  164. {
  165. float4 rgba = DrawLanczos(f_in, undistort);
  166. rgba.rgb *= multiplier;
  167. return rgba;
  168. }
  169. float4 PSDrawLanczosRGBATonemap(FragData f_in, bool undistort) : TARGET
  170. {
  171. float4 rgba = DrawLanczos(f_in, undistort);
  172. rgba.rgb = rec709_to_rec2020(rgba.rgb);
  173. rgba.rgb = reinhard(rgba.rgb);
  174. rgba.rgb = rec2020_to_rec709(rgba.rgb);
  175. return rgba;
  176. }
  177. float4 PSDrawLanczosRGBAMultiplyTonemap(FragData f_in, bool undistort) : TARGET
  178. {
  179. float4 rgba = DrawLanczos(f_in, undistort);
  180. rgba.rgb *= multiplier;
  181. rgba.rgb = rec709_to_rec2020(rgba.rgb);
  182. rgba.rgb = reinhard(rgba.rgb);
  183. rgba.rgb = rec2020_to_rec709(rgba.rgb);
  184. return rgba;
  185. }
  186. technique Draw
  187. {
  188. pass
  189. {
  190. vertex_shader = VSDefault(v_in);
  191. pixel_shader = PSDrawLanczosRGBA(f_in, false);
  192. }
  193. }
  194. technique DrawMultiply
  195. {
  196. pass
  197. {
  198. vertex_shader = VSDefault(v_in);
  199. pixel_shader = PSDrawLanczosRGBAMultiply(f_in, false);
  200. }
  201. }
  202. technique DrawTonemap
  203. {
  204. pass
  205. {
  206. vertex_shader = VSDefault(v_in);
  207. pixel_shader = PSDrawLanczosRGBATonemap(f_in, false);
  208. }
  209. }
  210. technique DrawMultiplyTonemap
  211. {
  212. pass
  213. {
  214. vertex_shader = VSDefault(v_in);
  215. pixel_shader = PSDrawLanczosRGBAMultiplyTonemap(f_in, false);
  216. }
  217. }
  218. technique DrawUndistort
  219. {
  220. pass
  221. {
  222. vertex_shader = VSDefault(v_in);
  223. pixel_shader = PSDrawLanczosRGBA(f_in, true);
  224. }
  225. }
  226. technique DrawUndistortMultiply
  227. {
  228. pass
  229. {
  230. vertex_shader = VSDefault(v_in);
  231. pixel_shader = PSDrawLanczosRGBAMultiply(f_in, true);
  232. }
  233. }
  234. technique DrawUndistortTonemap
  235. {
  236. pass
  237. {
  238. vertex_shader = VSDefault(v_in);
  239. pixel_shader = PSDrawLanczosRGBATonemap(f_in, true);
  240. }
  241. }
  242. technique DrawUndistortMultiplyTonemap
  243. {
  244. pass
  245. {
  246. vertex_shader = VSDefault(v_in);
  247. pixel_shader = PSDrawLanczosRGBAMultiplyTonemap(f_in, true);
  248. }
  249. }