Go to the documentation of this file.
25 #define CGROUPS (int [3]){ 32, 32, 1 }
52 C(1,
if ((o_offset[
i].x <=
pos.x) && (o_offset[
i].y <=
pos.y) &&
53 (
pos.x < (o_offset[
i].x + o_size[
i].x)) &&
54 (
pos.y < (o_offset[
i].y + o_size[
i].y))) { )
55 C(2, vec4 res = texture(overlay_img[i], pos - o_offset[i]); )
56 C(2, imageStore(output_img[i], pos, res); )
58 C(2, vec4 res = texture(main_img[i], pos); )
59 C(2, imageStore(output_img[i], pos, res); )
65 C(0,
void overlay_alpha_opaque(
int i, ivec2
pos) )
67 C(1, vec4 res = texture(main_img[
i],
pos); )
68 C(1,
if ((o_offset[
i].x <=
pos.x) && (o_offset[
i].y <=
pos.y) &&
69 (
pos.x < (o_offset[
i].x + o_size[
i].x)) &&
70 (
pos.y < (o_offset[
i].y + o_size[
i].y))) { )
71 C(2, vec4 ovr = texture(overlay_img[i], pos - o_offset[i]); )
72 C(2, res = ovr * ovr.a + res * (1.0f - ovr.a); )
74 C(2, imageStore(output_img[i], pos, res); )
76 C(1, imageStore(output_img[
i],
pos, res); )
104 .type = VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,
107 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
108 .updater =
s->main_images,
112 .name =
"overlay_img",
113 .type = VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,
116 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
117 .updater =
s->overlay_images,
121 .name =
"output_img",
122 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
124 .mem_quali =
"writeonly",
127 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
128 .updater =
s->output_images,
134 .type = VK_DESCRIPTOR_TYPE_STORAGE_BUFFER,
135 .mem_quali =
"readonly",
136 .mem_layout =
"std430",
137 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
138 .updater = &
s->params_desc,
139 .buf_content =
"ivec2 o_offset[3], o_size[3];",
143 VK_SHADER_STAGE_COMPUTE_BIT);
156 GLSLC(1, ivec2
pos = ivec2(gl_GlobalInvocationID.xy); );
160 GLSLC(2, overlay_alpha_opaque(
i,
pos); );
185 VK_BUFFER_USAGE_STORAGE_BUFFER_BIT,
186 VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT);
196 par->o_offset[0] =
s->overlay_x;
197 par->o_offset[1] =
s->overlay_y;
198 par->o_offset[2] = par->o_offset[0] >>
desc->log2_chroma_w;
199 par->o_offset[3] = par->o_offset[1] >>
desc->log2_chroma_h;
200 par->o_offset[4] = par->o_offset[0] >>
desc->log2_chroma_w;
201 par->o_offset[5] = par->o_offset[1] >>
desc->log2_chroma_h;
203 par->o_size[0] =
s->overlay_w;
204 par->o_size[1] =
s->overlay_h;
205 par->o_size[2] = par->o_size[0] >>
desc->log2_chroma_w;
206 par->o_size[3] = par->o_size[1] >>
desc->log2_chroma_h;
207 par->o_size[4] = par->o_size[0] >>
desc->log2_chroma_w;
208 par->o_size[5] = par->o_size[1] >>
desc->log2_chroma_h;
214 s->params_desc.buffer =
s->params_buf.buf;
215 s->params_desc.range = VK_WHOLE_SIZE;
235 VkCommandBuffer cmd_buf;
258 &
s->main_images[
i].imageView,
main->img[
i],
263 &
s->overlay_images[
i].imageView, overlay->
img[
i],
264 overlay_sw_formats[
i],
268 &
s->output_images[
i].imageView,
out->img[
i],
272 s->main_images[
i].imageLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
273 s->overlay_images[
i].imageLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
274 s->output_images[
i].imageLayout = VK_IMAGE_LAYOUT_GENERAL;
280 VkImageMemoryBarrier bar[3] = {
282 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
284 .dstAccessMask = VK_ACCESS_SHADER_READ_BIT,
285 .oldLayout =
main->layout[
i],
286 .newLayout =
s->main_images[
i].imageLayout,
287 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
288 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
289 .image =
main->img[
i],
290 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
291 .subresourceRange.levelCount = 1,
292 .subresourceRange.layerCount = 1,
295 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
297 .dstAccessMask = VK_ACCESS_SHADER_READ_BIT,
298 .oldLayout = overlay->
layout[
i],
299 .newLayout =
s->overlay_images[
i].imageLayout,
300 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
301 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
302 .image = overlay->
img[
i],
303 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
304 .subresourceRange.levelCount = 1,
305 .subresourceRange.layerCount = 1,
308 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
310 .dstAccessMask = VK_ACCESS_SHADER_WRITE_BIT,
311 .oldLayout =
out->layout[
i],
312 .newLayout =
s->output_images[
i].imageLayout,
313 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
314 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
315 .image =
out->img[
i],
316 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
317 .subresourceRange.levelCount = 1,
318 .subresourceRange.layerCount = 1,
322 vk->CmdPipelineBarrier(cmd_buf, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT,
323 VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, 0,
326 main->layout[
i] = bar[0].newLayout;
327 main->access[
i] = bar[0].dstAccessMask;
329 overlay->
layout[
i] = bar[1].newLayout;
330 overlay->
access[
i] = bar[1].dstAccessMask;
332 out->layout[
i] = bar[2].newLayout;
333 out->access[
i] = bar[2].dstAccessMask;
338 vk->CmdDispatch(cmd_buf,
374 if (!input_main || !input_overlay)
377 if (!
s->initialized) {
380 if (main_fc->
sw_format != overlay_fc->sw_format) {
385 s->overlay_w = input_overlay->
width;
386 s->overlay_h = input_overlay->
height;
454 #define OFFSET(x) offsetof(OverlayVulkanContext, x)
455 #define FLAGS (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM)
486 .
name =
"overlay_vulkan",
495 .priv_class = &overlay_vulkan_class,
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
VkDescriptorBufferInfo params_desc
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: query_formats should set, for each input and each output link, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
const VkComponentMapping ff_comp_identity_map
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically propagated through it.
int ff_vk_create_buf(FFVulkanContext *s, FFVkBuffer *buf, size_t size, VkBufferUsageFlags usage, VkMemoryPropertyFlagBits flags)
Create a VkBuffer with the specified parameters.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
uint8_t * data
The data buffer.
int ff_framesync_get_frame(FFFrameSync *fs, unsigned in, AVFrame **rframe, unsigned get)
Get the current frame in an input.
static const char overlay_noalpha[]
void ff_vk_bind_pipeline_exec(FFVulkanContext *s, FFVkExecContext *e, FFVulkanPipeline *pl)
Add a command to bind the completed pipeline and its descriptor sets.
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
This structure describes decoded (raw) audio or video data.
int ff_vk_filter_init(AVFilterContext *avctx)
General lavfi IO functions.
static int overlay_vulkan_activate(AVFilterContext *avctx)
int ff_vk_compile_shader(FFVulkanContext *s, FFVkSPIRVShader *shd, const char *entrypoint)
Compiles the shader, entrypoint must be set to "main".
static int overlay_vulkan_config_output(AVFilterLink *outlink)
static const AVFilterPad overlay_vulkan_outputs[]
void ff_vk_uninit(FFVulkanContext *s)
Frees the main Vulkan context.
const char * name
Filter name.
A link between two filters.
static int overlay_vulkan_blend(FFFrameSync *fs)
@ AV_PIX_FMT_VULKAN
Vulkan hardware images.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int ff_vk_add_exec_dep(FFVulkanContext *s, FFVkExecContext *e, AVFrame *frame, VkPipelineStageFlagBits in_wait_dst_flag)
Adds a frame as a queue dependency.
VkCommandBuffer ff_vk_get_exec_buf(FFVkExecContext *e)
Gets the command buffer to use for this submission from the exec context.
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
VkImage img[AV_NUM_DATA_POINTERS]
Vulkan images to which the memory is bound.
void * priv
private data for use by the filter
const AVFilter ff_vf_overlay_vulkan
A filter pad used for either input or output.
sed 's/edgedetect/foobar/g;s/EdgeDetect/Foobar/g' libavfilter/vf_edgedetect.c > libavfilter/vf_foobar.c; edit libavfilter/Makefile, and add an entry for "foobar" following the pattern of the other filters; edit libavfilter/allfilters.c, and add an entry for "foobar" following the pattern of the other filters; ./configure ...; make -j<whatever> ffmpeg; ./ffmpeg -i http://samples.ffmpeg.org/image-samples/lena.pnm -vf foobar foobar.png. If everything went right, you should get a foobar.png with Lena edge-detected. That's it, your new playground is ready. Some little details about what's going on: libavfilter/allfilters.c: this file is parsed by the configure script, which in turn will define variables for the build system and the C
void ff_vk_qf_init(FFVulkanContext *s, FFVkQueueFamilyCtx *qf, VkQueueFlagBits dev_family, int nb_queues)
Initialize a queue family with a specific number of queues.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
#define FF_ARRAY_ELEMS(a)
int ff_vk_create_imageview(FFVulkanContext *s, FFVkExecContext *e, VkImageView *v, VkImage img, VkFormat fmt, const VkComponentMapping map)
Create an imageview.
VkDescriptorImageInfo overlay_images[3]
FFVkSPIRVShader * ff_vk_init_shader(FFVulkanPipeline *pl, const char *name, VkShaderStageFlags stage)
Inits a shader for a specific pipeline.
#define AV_PIX_FMT_FLAG_ALPHA
The pixel format has an alpha channel.
static int process_frames(AVFilterContext *avctx, AVFrame *out_f, AVFrame *main_f, AVFrame *overlay_f)
static const AVOption overlay_vulkan_options[]
#define FILTER_INPUTS(array)
void ff_vk_update_descriptor_set(FFVulkanContext *s, FFVulkanPipeline *pl, int set_id)
Updates a descriptor set via the updaters defined.
int ff_vk_start_exec_recording(FFVulkanContext *s, FFVkExecContext *e)
Begin recording to the command buffer.
static av_cold int init_filter(AVFilterContext *ctx)
int main(int argc, char *argv[])
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
#define fs(width, name, subs,...)
static const AVFilterPad overlay_vulkan_inputs[]
filter_frame For filters that do not use the activate() callback
int ff_vk_create_exec_ctx(FFVulkanContext *s, FFVkExecContext **ctx, FFVkQueueFamilyCtx *qf)
Init an execution context for command recording and queue submission.
int ff_vk_filter_config_output(AVFilterLink *outlink)
void ff_vk_qf_rotate(FFVkQueueFamilyCtx *qf)
Rotate through the queues in a queue family.
VkDescriptorImageInfo main_images[3]
uint64_t flags
Combination of AV_PIX_FMT_FLAG_...
static const struct @328 planes[]
void ff_vk_discard_exec_deps(FFVkExecContext *e)
Discards all queue dependencies.
static av_cold int overlay_vulkan_init(AVFilterContext *avctx)
int ff_vk_unmap_buffers(FFVulkanContext *s, FFVkBuffer *buf, int nb_buffers, int flush)
Unmaps the buffer from userspace.
VkAccessFlagBits access[AV_NUM_DATA_POINTERS]
Updated after every barrier.
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
int ff_framesync_init_dualinput(FFFrameSync *fs, AVFilterContext *parent)
Initialize a frame sync structure for dualinput.
int ff_vk_init_pipeline_layout(FFVulkanContext *s, FFVulkanPipeline *pl)
Initializes the pipeline layout after all shaders and descriptor sets have been finished.
AVFilterContext * src
source filter
int ff_vk_submit_exec_queue(FFVulkanContext *s, FFVkExecContext *e)
Submits a command buffer to the queue for execution.
#define AVERROR_EXTERNAL
Generic error in an external library.
const VkFormat * av_vkfmt_from_pixfmt(enum AVPixelFormat p)
Returns the format of each image up to the number of planes for a given sw_format.
#define FILTER_SINGLE_PIXFMT(pix_fmt_)
int ff_vk_init_compute_pipeline(FFVulkanContext *s, FFVulkanPipeline *pl)
Initializes a compute pipeline.
#define i(width, name, range_min, range_max)
int w
agreed upon image width
static const char overlay_alpha[]
const char * ff_vk_shader_rep_fmt(enum AVPixelFormat pixfmt)
Gets the glsl format string for a pixel format.
const char * name
Pad name.
FFVulkanPipeline * ff_vk_create_pipeline(FFVulkanContext *s, FFVkQueueFamilyCtx *qf)
Inits a pipeline.
void ff_vk_free_buf(FFVulkanContext *s, FFVkBuffer *buf)
Frees a buffer.
AVFILTER_DEFINE_CLASS(overlay_vulkan)
This struct describes a set or pool of "hardware" frames (i.e. those with data not located in normal system memory).
AVBufferRef * hw_frames_ctx
For hwaccel-format frames, this should be a reference to the AVHWFramesContext describing the frame.
int ff_vk_add_descriptor_set(FFVulkanContext *s, FFVulkanPipeline *pl, FFVkSPIRVShader *shd, FFVulkanDescriptorSetBinding *desc, int num, int only_print_to_shader)
Adds a descriptor set to the shader and registers them in the pipeline.
int h
agreed upon image height
static void overlay_vulkan_uninit(AVFilterContext *avctx)
FFVkSampler * ff_vk_init_sampler(FFVulkanContext *s, int unnorm_coords, VkFilter filt)
Create a Vulkan sampler, will be auto-freed in ff_vk_filter_uninit()
VkDescriptorImageInfo output_images[3]
int ff_vk_filter_config_input(AVFilterLink *inlink)
VkImageLayout layout[AV_NUM_DATA_POINTERS]
int ff_vk_map_buffers(FFVulkanContext *s, FFVkBuffer *buf, uint8_t *mem[], int nb_buffers, int invalidate)
Maps the buffer to userspace.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes of an image.
#define FILTER_OUTPUTS(array)
void ff_vk_set_compute_shader_sizes(FFVkSPIRVShader *shd, int local_size[3])
Writes the workgroup size for a shader.
static av_cold int uninit(AVCodecContext *avctx)
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.