bicubic_scale.effect 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236
  1. /*
  2. * bicubic sharper (better for downscaling)
  3. * note - this shader is adapted from the GPL bsnes shader, very good stuff
  4. * there.
  5. */
  6. #include "color.effect"
  7. uniform float4x4 ViewProj;
  8. uniform texture2d image;
  9. uniform float2 base_dimension;
  10. uniform float2 base_dimension_i;
  11. uniform float undistort_factor = 1.0;
  12. uniform float multiplier;
  13. sampler_state textureSampler {
  14. Filter = Linear;
  15. AddressU = Clamp;
  16. AddressV = Clamp;
  17. };
  18. struct VertData {
  19. float4 pos : POSITION;
  20. float2 uv : TEXCOORD0;
  21. };
  22. struct VertOut {
  23. float2 uv : TEXCOORD0;
  24. float4 pos : POSITION;
  25. };
  26. struct FragData {
  27. float2 uv : TEXCOORD0;
  28. };
  29. VertOut VSDefault(VertData v_in)
  30. {
  31. VertOut vert_out;
  32. vert_out.uv = v_in.uv * base_dimension;
  33. vert_out.pos = mul(float4(v_in.pos.xyz, 1.0), ViewProj);
  34. return vert_out;
  35. }
  36. float4 weight4(float x)
  37. {
  38. /* Sharper version. May look better in some cases. B=0, C=0.75 */
  39. return float4(
  40. ((-0.75 * x + 1.5) * x - 0.75) * x,
  41. (1.25 * x - 2.25) * x * x + 1.0,
  42. ((-1.25 * x + 1.5) * x + 0.75) * x,
  43. (0.75 * x - 0.75) * x * x);
  44. }
  45. float AspectUndistortX(float x, float a)
  46. {
  47. // The higher the power, the longer the linear part will be.
  48. return (1.0 - a) * (x * x * x * x * x) + a * x;
  49. }
  50. float AspectUndistortU(float u)
  51. {
  52. // Normalize texture coord to -1.0 to 1.0 range, and back.
  53. return AspectUndistortX((u - 0.5) * 2.0, undistort_factor) * 0.5 + 0.5;
  54. }
  55. float2 undistort_coord(float xpos, float ypos)
  56. {
  57. return float2(AspectUndistortU(xpos), ypos);
  58. }
  59. float4 undistort_pixel(float xpos, float ypos)
  60. {
  61. return image.Sample(textureSampler, undistort_coord(xpos, ypos));
  62. }
  63. float4 undistort_line(float4 xpos, float ypos, float4 rowtaps)
  64. {
  65. return undistort_pixel(xpos.x, ypos) * rowtaps.x +
  66. undistort_pixel(xpos.y, ypos) * rowtaps.y +
  67. undistort_pixel(xpos.z, ypos) * rowtaps.z +
  68. undistort_pixel(xpos.w, ypos) * rowtaps.w;
  69. }
  70. float4 DrawBicubic(FragData f_in, bool undistort)
  71. {
  72. float2 pos = f_in.uv;
  73. float2 pos1 = floor(pos - 0.5) + 0.5;
  74. float2 f = pos - pos1;
  75. float4 rowtaps = weight4(f.x);
  76. float4 coltaps = weight4(f.y);
  77. float2 uv1 = pos1 * base_dimension_i;
  78. float2 uv0 = uv1 - base_dimension_i;
  79. float2 uv2 = uv1 + base_dimension_i;
  80. float2 uv3 = uv2 + base_dimension_i;
  81. if (undistort) {
  82. float4 xpos = float4(uv0.x, uv1.x, uv2.x, uv3.x);
  83. return undistort_line(xpos, uv0.y, rowtaps) * coltaps.x +
  84. undistort_line(xpos, uv1.y, rowtaps) * coltaps.y +
  85. undistort_line(xpos, uv2.y, rowtaps) * coltaps.z +
  86. undistort_line(xpos, uv3.y, rowtaps) * coltaps.w;
  87. }
  88. float u_weight_sum = rowtaps.y + rowtaps.z;
  89. float u_middle_offset = rowtaps.z * base_dimension_i.x / u_weight_sum;
  90. float u_middle = uv1.x + u_middle_offset;
  91. float v_weight_sum = coltaps.y + coltaps.z;
  92. float v_middle_offset = coltaps.z * base_dimension_i.y / v_weight_sum;
  93. float v_middle = uv1.y + v_middle_offset;
  94. int2 coord_top_left = int2(max(uv0 * base_dimension, 0.5));
  95. int2 coord_bottom_right = int2(min(uv3 * base_dimension, base_dimension - 0.5));
  96. float4 top = image.Load(int3(coord_top_left, 0)) * rowtaps.x;
  97. top += image.Sample(textureSampler, float2(u_middle, uv0.y)) * u_weight_sum;
  98. top += image.Load(int3(coord_bottom_right.x, coord_top_left.y, 0)) * rowtaps.w;
  99. float4 total = top * coltaps.x;
  100. float4 middle = image.Sample(textureSampler, float2(uv0.x, v_middle)) * rowtaps.x;
  101. middle += image.Sample(textureSampler, float2(u_middle, v_middle)) * u_weight_sum;
  102. middle += image.Sample(textureSampler, float2(uv3.x, v_middle)) * rowtaps.w;
  103. total += middle * v_weight_sum;
  104. float4 bottom = image.Load(int3(coord_top_left.x, coord_bottom_right.y, 0)) * rowtaps.x;
  105. bottom += image.Sample(textureSampler, float2(u_middle, uv3.y)) * u_weight_sum;
  106. bottom += image.Load(int3(coord_bottom_right, 0)) * rowtaps.w;
  107. total += bottom * coltaps.w;
  108. return total;
  109. }
  110. float4 PSDrawBicubicRGBA(FragData f_in, bool undistort) : TARGET
  111. {
  112. return DrawBicubic(f_in, undistort);
  113. }
  114. float4 PSDrawBicubicRGBAMultiply(FragData f_in, bool undistort) : TARGET
  115. {
  116. float4 rgba = DrawBicubic(f_in, undistort);
  117. rgba.rgb *= multiplier;
  118. return rgba;
  119. }
  120. float4 PSDrawBicubicRGBATonemap(FragData f_in, bool undistort) : TARGET
  121. {
  122. float4 rgba = DrawBicubic(f_in, undistort);
  123. rgba.rgb = rec709_to_rec2020(rgba.rgb);
  124. rgba.rgb = reinhard(rgba.rgb);
  125. rgba.rgb = rec2020_to_rec709(rgba.rgb);
  126. return rgba;
  127. }
  128. float4 PSDrawBicubicRGBAMultiplyTonemap(FragData f_in, bool undistort) : TARGET
  129. {
  130. float4 rgba = DrawBicubic(f_in, undistort);
  131. rgba.rgb *= multiplier;
  132. rgba.rgb = rec709_to_rec2020(rgba.rgb);
  133. rgba.rgb = reinhard(rgba.rgb);
  134. rgba.rgb = rec2020_to_rec709(rgba.rgb);
  135. return rgba;
  136. }
  137. technique Draw
  138. {
  139. pass
  140. {
  141. vertex_shader = VSDefault(v_in);
  142. pixel_shader = PSDrawBicubicRGBA(f_in, false);
  143. }
  144. }
  145. technique DrawMultiply
  146. {
  147. pass
  148. {
  149. vertex_shader = VSDefault(v_in);
  150. pixel_shader = PSDrawBicubicRGBAMultiply(f_in, false);
  151. }
  152. }
  153. technique DrawTonemap
  154. {
  155. pass
  156. {
  157. vertex_shader = VSDefault(v_in);
  158. pixel_shader = PSDrawBicubicRGBATonemap(f_in, false);
  159. }
  160. }
  161. technique DrawMultiplyTonemap
  162. {
  163. pass
  164. {
  165. vertex_shader = VSDefault(v_in);
  166. pixel_shader = PSDrawBicubicRGBAMultiplyTonemap(f_in, false);
  167. }
  168. }
  169. technique DrawUndistort
  170. {
  171. pass
  172. {
  173. vertex_shader = VSDefault(v_in);
  174. pixel_shader = PSDrawBicubicRGBA(f_in, true);
  175. }
  176. }
  177. technique DrawUndistortMultiply
  178. {
  179. pass
  180. {
  181. vertex_shader = VSDefault(v_in);
  182. pixel_shader = PSDrawBicubicRGBAMultiply(f_in, true);
  183. }
  184. }
  185. technique DrawUndistortTonemap
  186. {
  187. pass
  188. {
  189. vertex_shader = VSDefault(v_in);
  190. pixel_shader = PSDrawBicubicRGBATonemap(f_in, true);
  191. }
  192. }
  193. technique DrawUndistortMultiplyTonemap
  194. {
  195. pass
  196. {
  197. vertex_shader = VSDefault(v_in);
  198. pixel_shader = PSDrawBicubicRGBAMultiplyTonemap(f_in, true);
  199. }
  200. }