class cv::ocl::Kernel

Overview

#include <ocl.hpp>

class Kernel
{
public:
    // construction

    Kernel();

    Kernel(
        const char* kname,
        const Program& prog
        );

    Kernel(
        const char* kname,
        const ProgramSource& prog,
        const String& buildopts = String(),
        String* errmsg = 0
        );

    Kernel(const Kernel& k);

    // methods

    template <typename _Tp0>
    Kernel&
    args(const _Tp0& a0);

    template <
        typename _Tp0,
        typename _Tp1
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10,
        typename _Tp11
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10,
        const _Tp11& a11
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10,
        typename _Tp11,
        typename _Tp12
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10,
        const _Tp11& a11,
        const _Tp12& a12
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10,
        typename _Tp11,
        typename _Tp12,
        typename _Tp13
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10,
        const _Tp11& a11,
        const _Tp12& a12,
        const _Tp13& a13
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10,
        typename _Tp11,
        typename _Tp12,
        typename _Tp13,
        typename _Tp14
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10,
        const _Tp11& a11,
        const _Tp12& a12,
        const _Tp13& a13,
        const _Tp14& a14
        );

    template <
        typename _Tp0,
        typename _Tp1,
        typename _Tp2,
        typename _Tp3,
        typename _Tp4,
        typename _Tp5,
        typename _Tp6,
        typename _Tp7,
        typename _Tp8,
        typename _Tp9,
        typename _Tp10,
        typename _Tp11,
        typename _Tp12,
        typename _Tp13,
        typename _Tp14,
        typename _Tp15
        >
    Kernel&
    args(
        const _Tp0& a0,
        const _Tp1& a1,
        const _Tp2& a2,
        const _Tp3& a3,
        const _Tp4& a4,
        const _Tp5& a5,
        const _Tp6& a6,
        const _Tp7& a7,
        const _Tp8& a8,
        const _Tp9& a9,
        const _Tp10& a10,
        const _Tp11& a11,
        const _Tp12& a12,
        const _Tp13& a13,
        const _Tp14& a14,
        const _Tp15& a15
        );

    bool
    compileWorkGroupSize(size_t wsz []) const;

    bool
    create(
        const char* kname,
        const Program& prog
        );

    bool
    create(
        const char* kname,
        const ProgramSource& prog,
        const String& buildopts,
        String* errmsg = 0
        );

    bool
    empty() const;

    size_t
    localMemSize() const;

    Kernel&
    operator=(const Kernel& k);

    size_t
    preferedWorkGroupSizeMultiple() const;

    void*
    ptr() const;

    bool
    run(
        int dims,
        size_t globalsize [],
        size_t localsize [],
        bool sync,
        const Queue& q = Queue()
        );

    bool
    runTask(
        bool sync,
        const Queue& q = Queue()
        );

    int
    set(
        int i,
        const void* value,
        size_t sz
        );

    int
    set(
        int i,
        const Image2D& image2D
        );

    int
    set(
        int i,
        const UMat& m
        );

    int
    set(
        int i,
        const KernelArg& arg
        );

    template <typename _Tp>
    int
    set(
        int i,
        const _Tp& value
        );

    size_t
    workGroupSize() const;

protected:
    // fields

    Impl* p;
};

Detailed Documentation

Methods

bool
run(
    int dims,
    size_t globalsize [],
    size_t localsize [],
    bool sync,
    const Queue& q = Queue()
    )

Run the OpenCL kernel.

Parameters:

dims the work problem dimensions. It is the length of globalsize and localsize. It can be either 1, 2 or 3.
globalsize work items for each dimension. It is not the final globalsize passed to OpenCL. Each dimension will be adjusted to the nearest integer divisible by the corresponding value in localsize. If localsize is NULL, it will still be adjusted depending on dims. The adjusted values are greater than or equal to the original values.
localsize work-group size for each dimension.
sync specify whether to wait for OpenCL computation to finish before return.
q command queue