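/*******************************************************
 * Copyright (c) 2014, ArrayFire
 * All rights reserved.
 *
 * This file is distributed under 3-clause BSD license.
 * The complete license agreement can be obtained at:
 * http://arrayfire.com/licenses/BSD-3-Clause
 ********************************************************/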
#include <arrayfire.h>
#include <stdio.h>
#include <cstdlib>
using namespace af;
// File-scope state: timeit() takes a plain void(*)() callback, so the
// wrappers it times have to reach the image and kernels through globals.

// Input image that each convolution variant is applied to.
static array img;

// Host-side coefficients of the two 1D factors of the separable 5x5
// derivative kernel.
static float h_dx[] = {
    1.f / 12, -8.f / 12, 0, 8.f / 12, -1.f / 12,  // five point stencil
};
static float h_spread[] = {
    1.f / 5, 1.f / 5, 1.f / 5, 1.f / 5, 1.f / 5,
};

// Device kernels.
static array dx;
static array spread;
static array kernel;

// Outputs saved so the different versions can be value-checked afterwards.
static array full_out;
static array dsep_out;
static array hsep_out;
// wrapper functions for timeit() below
// timeit() callback: convolves img with the combined 2D kernel in a single
// convolve2() call and stores the result in full_out.
static void full() {
    full_out = convolve2(img, kernel);
}
// timeit() callback: separable convolution of img, passing dx and spread as
// two separate filters instead of their product; stores the result in
// dsep_out.
static void dsep() {
    dsep_out = convolve(dx, spread, img);
}
static bool fail(array &left, array &right) {
return (max<float>(abs(left - right)) > 1e-6);
int main(int argc, char **argv) {
try {
int device = argc > 1 ? atoi(argv[1]) : 0;
// setup image and device copies of kernels
img = randu(640, 480);
dx = array(5, 1, h_dx); // 5x1 kernel
spread = array(1, 5, h_spread); // 1x5 kernel
kernel = matmul(dx, spread); // 5x5 kernel
printf("full 2D convolution: %.5f seconds\n", timeit(full));
printf("separable, device pointers: %.5f seconds\n", timeit(dsep));
// ensure values are all the same across versions
if (fail(full_out, dsep_out)) { throw af::exception("full != dsep"); }
} catch (af::exception &e) { fprintf(stderr, "%s\n", e.what()); }
return 0;
AFAPI array matmul(const array &lhs, const array &rhs, const matProp optLhs=AF_MAT_NONE, const matProp optRhs=AF_MAT_NONE)
Matrix multiply of two arrays.
AFAPI void info()
AFAPI void setDevice(const int device)
Sets the current device.
AFAPI array abs(const array &in)
C++ Interface for absolute value.
A multi-dimensional data container.
Definition: array.h:35
Definition: algorithm.h:15
AFAPI double timeit(void(*fn)())
AFAPI array convolve2(const array &signal, const array &filter, const convMode mode=AF_CONV_DEFAULT, const convDomain domain=AF_CONV_AUTO)
C++ Interface for convolution on two dimensional signals.
static af::array array(af::dim4 idims, cl_mem buf, af::dtype type, bool retain=false)
Create an af::array object from an OpenCL cl_mem buffer.
Definition: opencl.h:327
AFAPI array randu(const dim4 &dims, const dtype ty, randomEngine &r)
An ArrayFire exception class.
Definition: exception.h:29
virtual const char * what() const
Returns an error message for the exception in a string format.
Definition: exception.h:60
AFAPI array convolve(const array &signal, const array &filter, const convMode mode=AF_CONV_DEFAULT, const convDomain domain=AF_CONV_AUTO)
C++ Interface for convolution on signals of any dimensionality (one through three).