diff options
author | dec05eba <dec05eba@protonmail.com> | 2025-03-30 03:36:39 +0200 |
---|---|---|
committer | dec05eba <dec05eba@protonmail.com> | 2025-03-30 03:36:39 +0200 |
commit | c679b2fdb6a8172df4e29b1fb12b54d1891665de (patch) | |
tree | 7f49ffb957e84d264e9cd59d569a2d3d437c6d11 | |
parent | b8a521a785e1c40ef247e6536f284afd9e39922a (diff) |
Use sampler2D for alpha blending compute shader instead of output image2D
-rw-r--r-- | TODO | 2 | ||||
-rw-r--r-- | include/egl.h | 4 | ||||
-rw-r--r-- | src/color_conversion.c | 42 | ||||
-rw-r--r-- | src/egl.c | 2 |
4 files changed, 36 insertions, 14 deletions
@@ -251,4 +251,4 @@ Support spanning multiple monitors with region capture. This would also allow th When webcam support is added also support v4l2loopback? this is done by using avdevice_register_all(); and -c v4l2 -o /dev/video0; but it needs to output raw data as well instead of h264 and possibly yuv420p. Maybe add a -k yuv420p option to do that. -Do proper exit, to call gsr_capture_destroy which will properly stop gsr-kms-server. Otherwise there can be zombie gsr-kms-server on error.
\ No newline at end of file +Do proper exit, to call gsr_capture_destroy which will properly stop gsr-kms-server. Otherwise there can be zombie gsr-kms-server on error. diff --git a/include/egl.h b/include/egl.h index 643ab30..f7b0cc1 100644 --- a/include/egl.h +++ b/include/egl.h @@ -139,6 +139,8 @@ typedef void(*__GLXextFuncPtr)(void); #define GL_WRITE_ONLY 0x88B9 #define GL_READ_WRITE 0x88BA #define GL_MAX_COMPUTE_FIXED_GROUP_INVOCATIONS 0x90EB +#define GL_TEXTURE0 0x84C0 +#define GL_TEXTURE1 0x84C1 #define GL_VENDOR 0x1F00 #define GL_RENDERER 0x1F01 @@ -236,6 +238,7 @@ struct gsr_egl { void (*glClearColor)(float red, float green, float blue, float alpha); void (*glGenTextures)(int n, unsigned int *textures); void (*glDeleteTextures)(int n, const unsigned int *texture); + void (*glActiveTexture)(unsigned int texture); void (*glBindTexture)(unsigned int target, unsigned int texture); void (*glBindImageTexture)(unsigned int unit, unsigned int texture, int level, unsigned char layered, int layer, unsigned int access, unsigned int format); void (*glTexParameteri)(unsigned int target, unsigned int pname, int param); @@ -285,6 +288,7 @@ struct gsr_egl { int (*glGetUniformLocation)(unsigned int program, const char *name); void (*glUniform1f)(int location, float v0); void (*glUniform2f)(int location, float v0, float v1); + void (*glUniform1i)(int location, int v0); void (*glUniform2i)(int location, int v0, int v1); void (*glUniformMatrix2fv)(int location, int count, unsigned char transpose, const float *value); void (*glDebugMessageCallback)(GLDEBUGPROC callback, const void *userParam); diff --git a/src/color_conversion.c b/src/color_conversion.c index 72390f5..e33b7b9 100644 --- a/src/color_conversion.c +++ b/src/color_conversion.c @@ -86,12 +86,13 @@ static int load_compute_shader_y(gsr_shader *shader, gsr_egl *egl, gsr_color_uni snprintf(compute_shader, sizeof(compute_shader), "#version 430 core\n" "layout (local_size_x = %d, local_size_y = %d, local_size_z = 1) in;\n" - "uniform sampler2D imgInput;\n" + "layout(binding = 0) uniform sampler2D imgInput;\n" + "layout(binding = 1) uniform sampler2D imgBackground;\n" "uniform ivec2 source_position;\n" "uniform ivec2 target_position;\n" "uniform vec2 scale;\n" "uniform mat2 rotation_matrix;\n" - "layout(%s, binding = 0) uniform image2D imgOutput;\n" + "layout(%s, binding = 0) writeonly uniform image2D imgOutput;\n" "%s" "void main() {\n" " ivec2 texelCoord = ivec2(gl_GlobalInvocationID.xy);\n" @@ -100,7 +101,7 @@ static int load_compute_shader_y(gsr_shader *shader, gsr_egl *egl, gsr_color_uni " vec2 texCoord = vec2(rotated_texel_coord)/vec2(size);\n" " vec4 source_color = texture(imgInput, texCoord);\n" " vec4 source_color_yuv = RGBtoYUV * vec4(source_color.rgb, 1.0);\n" - " vec4 output_color_yuv = imageLoad(imgOutput, ivec2(rotated_texel_coord) + target_position);\n" + " vec4 output_color_yuv = texture(imgBackground, (rotated_texel_coord + vec2(target_position))/vec2(textureSize(imgBackground, 0)));\n" " float y_color = mix(output_color_yuv.r, source_color_yuv.r, source_color.a);\n" " imageStore(imgOutput, texelCoord + target_position, vec4(y_color, 1.0, 1.0, 1.0));\n" "}\n", max_local_size_dim, max_local_size_dim, use_16bit_colors ? "r16" : "r8", color_transform_matrix); @@ -123,12 +124,13 @@ static int load_compute_shader_uv(gsr_shader *shader, gsr_egl *egl, gsr_color_un snprintf(compute_shader, sizeof(compute_shader), "#version 430 core\n" "layout (local_size_x = %d, local_size_y = %d, local_size_z = 1) in;\n" - "uniform sampler2D imgInput;\n" + "layout(binding = 0) uniform sampler2D imgInput;\n" + "layout(binding = 1) uniform sampler2D imgBackground;\n" "uniform ivec2 source_position;\n" "uniform ivec2 target_position;\n" "uniform vec2 scale;\n" "uniform mat2 rotation_matrix;\n" - "layout(%s, binding = 0) uniform image2D imgOutput;\n" + "layout(%s, binding = 0) writeonly uniform image2D imgOutput;\n" "%s" "void main() {\n" " ivec2 texelCoord = ivec2(gl_GlobalInvocationID.xy);\n" @@ -137,7 +139,7 @@ static int load_compute_shader_uv(gsr_shader *shader, gsr_egl *egl, gsr_color_un " vec2 texCoord = vec2(rotated_texel_coord)/vec2(size);\n" " vec4 source_color = texture(imgInput, texCoord * 2.0);\n" " vec4 source_color_yuv = RGBtoYUV * vec4(source_color.rgb, 1.0);\n" - " vec4 output_color_yuv = imageLoad(imgOutput, ivec2(rotated_texel_coord) + target_position/2);\n" + " vec4 output_color_yuv = texture(imgBackground, (rotated_texel_coord + vec2(target_position/2))/vec2(textureSize(imgBackground, 0)));\n" " vec2 uv_color = mix(output_color_yuv.rg, source_color_yuv.gb, source_color.a);\n" " imageStore(imgOutput, texelCoord + target_position/2, vec4(uv_color, 1.0, 1.0));\n" "}\n", max_local_size_dim, max_local_size_dim, use_16bit_colors ? "rg16" : "rg8", color_transform_matrix); @@ -157,7 +159,8 @@ static int load_compute_shader_rgb(gsr_shader *shader, gsr_egl *egl, gsr_color_u snprintf(compute_shader, sizeof(compute_shader), "#version 430 core\n" "layout (local_size_x = %d, local_size_y = %d, local_size_z = 1) in;\n" - "uniform sampler2D imgInput;\n" + "layout(binding = 0) uniform sampler2D imgInput;\n" + "layout(binding = 1) uniform sampler2D imgBackground;\n" "uniform ivec2 source_position;\n" "uniform ivec2 target_position;\n" "uniform vec2 scale;\n" @@ -169,9 +172,9 @@ static int load_compute_shader_rgb(gsr_shader *shader, gsr_egl *egl, gsr_color_u " vec2 rotated_texel_coord = vec2(texelCoord - source_position - size/2) * rotation_matrix + vec2(size/2) + 0.5;\n" " vec2 texCoord = vec2(rotated_texel_coord)/vec2(size);\n" " vec4 source_color = texture(imgInput, texCoord);\n" - //" vec4 output_color = imageLoad(imgOutput, ivec2(rotated_texel_coord) + target_position);\n" - //" vec3 color = mix(output_color.rgb, source_color.rgb, source_color.a);\n" - " imageStore(imgOutput, texelCoord + target_position, source_color);\n" + " vec4 output_color = texture(imgBackground, (rotated_texel_coord + vec2(target_position))/vec2(textureSize(imgBackground, 0)));\n" + " vec3 color = mix(output_color.rgb, source_color.rgb, source_color.a);\n" + " imageStore(imgOutput, texelCoord + target_position, vec4(color, 1.0));\n" "}\n", max_local_size_dim, max_local_size_dim); if(gsr_shader_init(shader, egl, NULL, NULL, compute_shader) != 0) @@ -378,6 +381,11 @@ void gsr_color_conversion_draw(gsr_color_conversion *self, unsigned int texture_ case GSR_DESTINATION_COLOR_NV12: case GSR_DESTINATION_COLOR_P010: { const bool use_16bit_colors = self->params.destination_color == GSR_DESTINATION_COLOR_P010; + + self->params.egl->glActiveTexture(GL_TEXTURE1); + self->params.egl->glBindTexture(GL_TEXTURE_2D, self->params.destination_textures[0]); + self->params.egl->glActiveTexture(GL_TEXTURE0); + // Y { gsr_shader_use(&self->shaders[0]); @@ -385,12 +393,16 @@ void gsr_color_conversion_draw(gsr_color_conversion *self, unsigned int texture_ self->params.egl->glUniform2i(self->uniforms[0].source_position, source_position.x, source_position.y); self->params.egl->glUniform2i(self->uniforms[0].target_position, destination_pos.x, destination_pos.y); self->params.egl->glUniform2f(self->uniforms[0].scale, scale.x, scale.y); - self->params.egl->glBindImageTexture(0, self->params.destination_textures[0], 0, GL_FALSE, 0, GL_READ_WRITE, use_16bit_colors ? GL_R16 : GL_R8); + self->params.egl->glBindImageTexture(0, self->params.destination_textures[0], 0, GL_FALSE, 0, GL_WRITE_ONLY, use_16bit_colors ? GL_R16 : GL_R8); const double num_groups_x = (double)texture_size.x/(double)self->max_local_size_dim + 0.5; const double num_groups_y = (double)texture_size.y/(double)self->max_local_size_dim + 0.5; self->params.egl->glDispatchCompute(max_int(1, num_groups_x), max_int(1, num_groups_y), 1); } + self->params.egl->glActiveTexture(GL_TEXTURE1); + self->params.egl->glBindTexture(GL_TEXTURE_2D, self->params.destination_textures[1]); + self->params.egl->glActiveTexture(GL_TEXTURE0); + // UV { gsr_shader_use(&self->shaders[1]); @@ -398,7 +410,7 @@ void gsr_color_conversion_draw(gsr_color_conversion *self, unsigned int texture_ self->params.egl->glUniform2i(self->uniforms[1].source_position, source_position.x, source_position.y); self->params.egl->glUniform2i(self->uniforms[1].target_position, destination_pos.x, destination_pos.y); self->params.egl->glUniform2f(self->uniforms[1].scale, scale.x, scale.y); - self->params.egl->glBindImageTexture(0, self->params.destination_textures[1], 0, GL_FALSE, 0, GL_READ_WRITE, use_16bit_colors ? GL_RG16 : GL_RG8); + self->params.egl->glBindImageTexture(0, self->params.destination_textures[1], 0, GL_FALSE, 0, GL_WRITE_ONLY, use_16bit_colors ? GL_RG16 : GL_RG8); const double num_groups_x = (double)texture_size.x*0.5/(double)self->max_local_size_dim + 0.5; const double num_groups_y = (double)texture_size.y*0.5/(double)self->max_local_size_dim + 0.5; self->params.egl->glDispatchCompute(max_int(1, num_groups_x), max_int(1, num_groups_y), 1); @@ -406,12 +418,16 @@ void gsr_color_conversion_draw(gsr_color_conversion *self, unsigned int texture_ break; } case GSR_DESTINATION_COLOR_RGB8: { + self->params.egl->glActiveTexture(GL_TEXTURE1); + self->params.egl->glBindTexture(GL_TEXTURE_2D, self->params.destination_textures[0]); + self->params.egl->glActiveTexture(GL_TEXTURE0); + gsr_shader_use(&self->shaders[2]); self->params.egl->glUniformMatrix2fv(self->uniforms[2].rotation_matrix, 1, GL_TRUE, (const float*)rotation_matrix); self->params.egl->glUniform2i(self->uniforms[2].source_position, source_position.x, source_position.y); self->params.egl->glUniform2i(self->uniforms[2].target_position, destination_pos.x, destination_pos.y); self->params.egl->glUniform2f(self->uniforms[2].scale, scale.x, scale.y); - self->params.egl->glBindImageTexture(0, self->params.destination_textures[0], 0, GL_FALSE, 0, GL_READ_WRITE, GL_RGBA8); + self->params.egl->glBindImageTexture(0, self->params.destination_textures[0], 0, GL_FALSE, 0, GL_WRITE_ONLY, GL_RGBA8); const double num_groups_x = (double)texture_size.x/(double)self->max_local_size_dim + 0.5; const double num_groups_y = (double)texture_size.y/(double)self->max_local_size_dim + 0.5; self->params.egl->glDispatchCompute(max_int(1, num_groups_x), max_int(1, num_groups_y), 1); @@ -283,6 +283,7 @@ static bool gsr_egl_load_gl(gsr_egl *self, void *library) { { (void**)&self->glClearColor, "glClearColor" }, { (void**)&self->glGenTextures, "glGenTextures" }, { (void**)&self->glDeleteTextures, "glDeleteTextures" }, + { (void**)&self->glActiveTexture, "glActiveTexture" }, { (void**)&self->glBindTexture, "glBindTexture" }, { (void**)&self->glBindImageTexture, "glBindImageTexture" }, { (void**)&self->glTexParameteri, "glTexParameteri" }, @@ -332,6 +333,7 @@ static bool gsr_egl_load_gl(gsr_egl *self, void *library) { { (void**)&self->glGetUniformLocation, "glGetUniformLocation" }, { (void**)&self->glUniform1f, "glUniform1f" }, { (void**)&self->glUniform2f, "glUniform2f" }, + { (void**)&self->glUniform1i, "glUniform1i" }, { (void**)&self->glUniform2i, "glUniform2i" }, { (void**)&self->glUniformMatrix2fv, "glUniformMatrix2fv" }, { (void**)&self->glDebugMessageCallback, "glDebugMessageCallback" }, |