45 C(0, shared vec4 cache[DIR(gl_WorkGroupSize) + FILTER_RADIUS*2 + 1]; )
47 C(0,
void distort(
const ivec2
pos,
const int idx) )
49 C(1,
const uint cp = DIR(gl_LocalInvocationID) + FILTER_RADIUS; )
51 C(1, cache[cp] = texture(input_img[idx], pos); )
53 C(1,
const ivec2 loc_l = pos - INC(FILTER_RADIUS); )
54 C(1, cache[cp - FILTER_RADIUS] = texture(input_img[idx], loc_l); )
56 C(1,
const ivec2 loc_h = pos + INC(DIR(gl_WorkGroupSize)); )
57 C(1, cache[cp + DIR(gl_WorkGroupSize)] = texture(input_img[idx], loc_h); )
61 C(1, vec4 sum = vec4(0); )
62 C(1,
for (
int p = -FILTER_RADIUS; p <= FILTER_RADIUS; p++) )
63 C(2, sum += cache[cp + p]; )
65 C(1, sum /= vec4(FILTER_RADIUS*2 + 1); )
66 C(1, imageStore(output_img[idx], pos, sum); )
81 .type = VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,
84 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
89 .type = VK_DESCRIPTOR_TYPE_STORAGE_IMAGE,
91 .mem_quali =
"writeonly",
94 .stages = VK_SHADER_STAGE_COMPUTE_BIT,
114 VK_SHADER_STAGE_COMPUTE_BIT);
121 GLSLC(0, #define INC(x) (ivec2(x, 0)) );
122 GLSLC(0, #define DIR(var) (var.x) );
127 GLSLC(1,
const ivec2
pos = ivec2(gl_GlobalInvocationID.xy); );
132 if (s->
planes & (1 << i)) {
135 GLSLF(2, vec4 res = texture(input_img[%i],
pos); ,
i);
136 GLSLF(2, imageStore(output_img[%i],
pos, res); ,
i);
157 VK_SHADER_STAGE_COMPUTE_BIT);
164 GLSLC(0, #define INC(x) (ivec2(0, x)) );
165 GLSLC(0, #define DIR(var) (var.y) );
170 GLSLC(1,
const ivec2
pos = ivec2(gl_GlobalInvocationID.xy); );
175 if (s->
planes & (1 << i)) {
178 GLSLF(2, vec4 res = texture(input_img[%i],
pos); ,
i);
179 GLSLF(2, imageStore(output_img[%i],
pos, res); ,
i);
205 VkCommandBuffer cmd_buf;
232 s->
input_images[
i].imageLayout = VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
233 s->
tmp_images[
i].imageLayout = VK_IMAGE_LAYOUT_GENERAL;
241 VkImageMemoryBarrier bar[] = {
243 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
245 .dstAccessMask = VK_ACCESS_SHADER_READ_BIT,
248 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
249 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
251 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
252 .subresourceRange.levelCount = 1,
253 .subresourceRange.layerCount = 1,
256 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
258 .dstAccessMask = VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_SHADER_READ_BIT,
259 .oldLayout =
tmp->layout[
i],
261 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
262 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
263 .image =
tmp->img[
i],
264 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
265 .subresourceRange.levelCount = 1,
266 .subresourceRange.layerCount = 1,
269 .sType = VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,
271 .dstAccessMask = VK_ACCESS_SHADER_WRITE_BIT,
274 .srcQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
275 .dstQueueFamilyIndex = VK_QUEUE_FAMILY_IGNORED,
276 .image = out->
img[
i],
277 .subresourceRange.aspectMask = VK_IMAGE_ASPECT_COLOR_BIT,
278 .subresourceRange.levelCount = 1,
279 .subresourceRange.layerCount = 1,
283 vkCmdPipelineBarrier(cmd_buf, VK_PIPELINE_STAGE_TOP_OF_PIPE_BIT,
284 VK_PIPELINE_STAGE_COMPUTE_SHADER_BIT, 0,
287 in->
layout[
i] = bar[0].newLayout;
288 in->
access[
i] = bar[0].dstAccessMask;
290 tmp->layout[
i] = bar[1].newLayout;
291 tmp->access[
i] = bar[1].dstAccessMask;
293 out->
layout[
i] = bar[2].newLayout;
294 out->
access[
i] = bar[2].dstAccessMask;
371 #define OFFSET(x) offsetof(AvgBlurVulkanContext, x) 372 #define FLAGS (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM) 402 .
name =
"avgblur_vulkan",
408 .
inputs = avgblur_vulkan_inputs,
409 .
outputs = avgblur_vulkan_outputs,
410 .priv_class = &avgblur_vulkan_class,
int ff_vk_add_exec_dep(AVFilterContext *avctx, FFVkExecContext *e, AVFrame *frame, VkPipelineStageFlagBits in_wait_dst_flag)
Adds a frame as a queue dependency.
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically propagated through it.
int ff_vk_init_pipeline_layout(AVFilterContext *avctx, VulkanPipeline *pl)
Initializes the pipeline layout after all shaders and descriptor sets have been finished.
VkDescriptorImageInfo tmp_images[3]
int ff_vk_add_descriptor_set(AVFilterContext *avctx, VulkanPipeline *pl, SPIRVShader *shd, VulkanDescriptorSetBinding *desc, int num, int only_print_to_shader)
Adds a descriptor set to the shader and registers it in the pipeline.
This structure describes decoded (raw) audio or video data.
void ff_vk_filter_uninit(AVFilterContext *avctx)
static const AVFilterPad avgblur_vulkan_outputs[]
const char * ff_vk_shader_rep_fmt(enum AVPixelFormat pixfmt)
Gets the glsl format string for a pixel format.
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
static av_cold int init(AVCodecContext *avctx)
int ff_vk_init_compute_pipeline(AVFilterContext *avctx, VulkanPipeline *pl)
Initializes a compute pipeline.
int h
agreed upon image height
static int avgblur_vulkan_filter_frame(AVFilterLink *link, AVFrame *in)
int ff_vk_create_imageview(AVFilterContext *avctx, FFVkExecContext *e, VkImageView *v, VkImage img, VkFormat fmt, const VkComponentMapping map)
Create an imageview.
int ff_vk_filter_config_output(AVFilterLink *outlink)
int ff_vk_start_exec_recording(AVFilterContext *avctx, FFVkExecContext *e)
Begin recording to the command buffer.
static const char blur_kernel[]
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
const VkFormat * av_vkfmt_from_pixfmt(enum AVPixelFormat p)
Returns the format of each image up to the number of planes for a given sw_format.
VkImage img[AV_NUM_DATA_POINTERS]
Vulkan images to which the memory is bound.
const char * name
Pad name.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
static av_cold int uninit(AVCodecContext *avctx)
VkDescriptorImageInfo output_images[3]
void ff_vk_set_compute_shader_sizes(AVFilterContext *avctx, SPIRVShader *shd, int local_size[3])
Writes the workgroup size for a shader.
int queue_family_comp_index
Queue family index for compute ops, and the amount of queues enabled.
int ff_vk_filter_init(AVFilterContext *avctx)
A filter pad used for either input or output.
A link between two filters.
int ff_vk_filter_query_formats(AVFilterContext *avctx)
General lavfi IO functions.
#define i(width, name, range_min, range_max)
enum AVPixelFormat input_format
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void * priv
private data for use by the filter
int w
agreed upon image width
VkSampler * ff_vk_init_sampler(AVFilterContext *avctx, int unnorm_coords, VkFilter filt)
Create a Vulkan sampler; it will be freed automatically in ff_vk_filter_uninit().
int ff_vk_create_exec_ctx(AVFilterContext *avctx, FFVkExecContext **ctx)
Init an execution context for command recording and queue submission.
static int process_frames(AVFilterContext *avctx, AVFrame *out_f, AVFrame *tmp_f, AVFrame *in_f)
VkAccessFlagBits access[AV_NUM_DATA_POINTERS]
Updated after every barrier.
int ff_vk_submit_exec_queue(AVFilterContext *avctx, FFVkExecContext *e)
Submits a command buffer to the queue for execution.
int main(int argc, char *argv[])
AVFilter ff_vf_avgblur_vulkan
VulkanFilterContext vkctx
static const AVFilterPad inputs[]
void ff_vk_bind_pipeline_exec(AVFilterContext *avctx, FFVkExecContext *e, VulkanPipeline *pl)
Add a command to bind the completed pipeline and its descriptor sets.
static const AVFilterPad outputs[]
#define FF_ARRAY_ELEMS(a)
static const AVFilterPad avgblur_vulkan_inputs[]
const VkComponentMapping ff_comp_identity_map
static void avgblur_vulkan_uninit(AVFilterContext *avctx)
int ff_vk_compile_shader(AVFilterContext *avctx, SPIRVShader *shd, const char *entrypoint)
Compiles the shader, entrypoint must be set to "main".
VkDescriptorImageInfo input_images[3]
SPIRVShader * ff_vk_init_shader(AVFilterContext *avctx, VulkanPipeline *pl, const char *name, VkShaderStageFlags stage)
Inits a shader for a specific pipeline.
AVVulkanDeviceContext * hwctx
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
VulkanPipeline * ff_vk_create_pipeline(AVFilterContext *avctx)
Inits a pipeline.
static const AVOption avgblur_vulkan_options[]
const char * name
Filter name.
VkCommandBuffer ff_vk_get_exec_buf(AVFilterContext *avctx, FFVkExecContext *e)
Gets the command buffer to use for this submission from the execution context.
#define GET_QUEUE_COUNT(hwctx, graph, comp, tx)
AVFilterLink ** outputs
array of pointers to output links
void ff_vk_discard_exec_deps(AVFilterContext *avctx, FFVkExecContext *e)
Discards all queue dependencies.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
AVFILTER_DEFINE_CLASS(avgblur_vulkan)
static int query_formats(AVFilterContext *ctx)
enum AVPixelFormat output_format
AVFilterContext * dst
dest filter
int ff_vk_filter_config_input(AVFilterLink *inlink)
VkImageLayout layout[AV_NUM_DATA_POINTERS]
uint32_t av_get_random_seed(void)
Get a seed to use in conjunction with random functions.
static av_cold int init_filter(AVFilterContext *ctx, AVFrame *in)
#define DUP_SAMPLER_ARRAY4(x)
#define AVERROR_EXTERNAL
Generic error in an external library.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
void ff_vk_update_descriptor_set(AVFilterContext *avctx, VulkanPipeline *pl, int set_id)
Updates a descriptor set via the updaters defined.