diff options
author | Danil Iashchenko <danyaschenko@gmail.com> | 2018-03-24 18:57:43 +0300 |
---|---|---|
committer | Mark Thompson <sw@jkqxz.net> | 2018-03-26 22:26:35 +0100 |
commit | 9f17875134754eef899aefd30500904635edec9e (patch) | |
tree | a6e51a9be496681756bc3633456eb9b9e287b563 /libavfilter/opencl | |
parent | cfe1a9d311de6c36641cf295004cdbc77d7b600c (diff) | |
download | ffmpeg-streaming-9f17875134754eef899aefd30500904635edec9e.zip ffmpeg-streaming-9f17875134754eef899aefd30500904635edec9e.tar.gz |
libavfilter: Add OpenCL convolution filter
Behaves like existing convolution filter.
Signed-off-by: Mark Thompson <sw@jkqxz.net>
Diffstat (limited to 'libavfilter/opencl')
-rw-r--r-- | libavfilter/opencl/convolution.cl | 45 |
1 files changed, 45 insertions, 0 deletions
```diff
diff --git a/libavfilter/opencl/convolution.cl b/libavfilter/opencl/convolution.cl
new file mode 100644
index 0000000..03ef4ef
--- /dev/null
+++ b/libavfilter/opencl/convolution.cl
@@ -0,0 +1,45 @@
+/*
+ * Copyright (c) 2018 Danil Iashchenko
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+__kernel void convolution_global(__write_only image2d_t dst,
+                                 __read_only image2d_t src,
+                                 int coef_matrix_dim,
+                                 __constant float *coef_matrix,
+                                 float div,
+                                 float bias)
+{
+    const sampler_t sampler = (CLK_NORMALIZED_COORDS_FALSE |
+                               CLK_ADDRESS_CLAMP_TO_EDGE |
+                               CLK_FILTER_NEAREST);
+
+    const int half_matrix_dim = (coef_matrix_dim / 2);
+    int2 loc = (int2)(get_global_id(0), get_global_id(1));
+    float4 convPix = (float4)(0.0f, 0.0f, 0.0f, 0.0f);
+
+    for (int conv_i = -half_matrix_dim; conv_i <= half_matrix_dim; conv_i++) {
+        for (int conv_j = -half_matrix_dim; conv_j <= half_matrix_dim; conv_j++) {
+            float4 px = read_imagef(src, sampler, loc + (int2)(conv_j, conv_i));
+            convPix += px * coef_matrix[(conv_i + half_matrix_dim) * coef_matrix_dim +
+                                        (conv_j + half_matrix_dim)];
+        }
+    }
+    float4 dstPix = convPix * div + bias;
+    write_imagef(dst, loc, dstPix);
+}
```