/*
 * Copyright (C) 2011-2013 Karlsruhe Institute of Technology
 *
 * This file is part of Ufo.
 *
 * This library is free software: you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, either
 * version 3 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "config.h"

#ifdef __APPLE__
#include <OpenCL/cl.h>
#else
#include <CL/cl.h>
#endif

#include <math.h>

#include "ufo-blur-task.h"

/*
 * Per-instance state of the blur task.
 */
struct _UfoBlurTaskPrivate {
    guint       size;               /* value of the "size" property */
    gfloat      sigma;              /* value of the "sigma" property */
    cl_context  context;            /* context retained in setup() */
    cl_kernel   h_kernel;           /* "h_gaussian" kernel from gaussian.cl */
    cl_kernel   v_kernel;           /* "v_gaussian" kernel from gaussian.cl */
    cl_mem      weights_mem;        /* normalised weights, created lazily */
    cl_mem      intermediate_mem;   /* output of h_kernel, input of v_kernel */
    gsize       intermediate_size;  /* byte size intermediate_mem was created with */
};

static void ufo_task_interface_init (UfoTaskIface *iface);

G_DEFINE_TYPE_WITH_CODE (UfoBlurTask, ufo_blur_task, UFO_TYPE_TASK_NODE,
                         G_IMPLEMENT_INTERFACE (UFO_TYPE_TASK,
                                                ufo_task_interface_init))

#define UFO_BLUR_TASK_GET_PRIVATE(obj) (G_TYPE_INSTANCE_GET_PRIVATE((obj), UFO_TYPE_BLUR_TASK, UfoBlurTaskPrivate))

enum {
    PROP_0,
    PROP_SIZE,
    PROP_SIGMA,
    N_PROPERTIES
};

static GParamSpec *properties[N_PROPERTIES] = { NULL, };

/*
 * Create a new blur task with default property values.
 *
 * Returns: the new object, cast to UfoNode.
 */
UfoNode *
ufo_blur_task_new (void)
{
    return UFO_NODE (g_object_new (UFO_TYPE_BLUR_TASK, NULL));
}

/*
 * UfoTask::setup implementation: look up both kernels in "gaussian.cl" and
 * take a reference on the kernels and on the OpenCL context.
 *
 * Returns early as soon as a kernel lookup reports an error through @error.
 * UFO_RESOURCES_CHECK_SET_AND_RETURN is defined outside this file; presumably
 * it stores the OpenCL failure in @error and returns -- confirm against
 * ufo-resources.h.
 */
static void
ufo_blur_task_setup (UfoTask *task,
                     UfoResources *resources,
                     GError **error)
{
    UfoBlurTaskPrivate *priv;

    priv = UFO_BLUR_TASK_GET_PRIVATE (task);

    priv->h_kernel = ufo_resources_get_kernel (resources, "gaussian.cl", "h_gaussian", NULL, error);

    if (error && *error)
        return;

    priv->v_kernel = ufo_resources_get_kernel (resources, "gaussian.cl", "v_gaussian", NULL, error);

    if (error && *error)
        return;

    UFO_RESOURCES_CHECK_SET_AND_RETURN (clRetainKernel (priv->h_kernel), error);
    UFO_RESOURCES_CHECK_SET_AND_RETURN (clRetainKernel (priv->v_kernel), error);

    priv->context = ufo_resources_get_context (resources);
    UFO_RESOURCES_CHECK_SET_AND_RETURN (clRetainContext (priv->context), error);
}

/*
 * UfoTask::get_requisition implementation.
 *
 * The output requisition is copied from the first input.  As a side effect
 * the device buffers needed by process() are prepared:
 *
 *  - the weights buffer is built once, from the "size" and "sigma" values
 *    current at that moment, and bound to argument 2 of both kernels
 *    together with size / 2 as argument 3;
 *  - the intermediate buffer holds dims[0] * dims[1] floats and is recreated
 *    whenever that byte size differs from the one it was allocated with.
 *
 * @error is not written by this function.
 */
static void
ufo_blur_task_get_requisition (UfoTask *task,
                               UfoBuffer **inputs,
                               UfoRequisition *requisition,
                               GError **error)
{
    UfoBlurTaskPrivate *priv;
    gsize size;

    priv = UFO_BLUR_TASK_GET_PRIVATE (task);
    ufo_buffer_get_requisition (inputs[0], requisition);

    if (priv->weights_mem == NULL) {
        guint kernel_size;
        guint kernel_size_2;
        gfloat *weights;
        gfloat sum;
        cl_int err;

        kernel_size = priv->size;
        kernel_size_2 = kernel_size / 2;
        sum = 0.0;
        weights = g_malloc0 (kernel_size * sizeof(gfloat));

        /*
         * Fill the array symmetrically from both ends towards the centre,
         * x being the distance to the centre tap.  For an even size the last
         * iteration (x == 0) also overwrites weights[kernel_size_2 - 1], so
         * both centre entries end up holding the peak value.
         */
        for (guint i = 0; i < kernel_size_2 + 1; i++) {
            gfloat x = (gfloat) (kernel_size_2 - i);

            weights[i] = (gfloat) (1.0 / (priv->sigma * sqrt(2*G_PI)) * exp((x * x) / (-2.0 * priv->sigma * priv->sigma)));
            weights[kernel_size-i-1] = weights[i];
        }

        /* Normalise so that all weights add up to one. */
        for (guint i = 0; i < kernel_size; i++)
            sum += weights[i];

        for (guint i = 0; i < kernel_size; i++)
            weights[i] /= sum;

        /* CL_MEM_COPY_HOST_PTR copies the data, the host array is freed below. */
        priv->weights_mem = clCreateBuffer (priv->context,
                                            CL_MEM_READ_ONLY | CL_MEM_COPY_HOST_PTR,
                                            kernel_size * sizeof(gfloat),
                                            weights,
                                            &err);
        UFO_RESOURCES_CHECK_CLERR (err);

        UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->h_kernel, 2, sizeof(cl_mem), &priv->weights_mem));
        UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->v_kernel, 2, sizeof(cl_mem), &priv->weights_mem));

        UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->h_kernel, 3, sizeof(guint), &kernel_size_2));
        UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->v_kernel, 3, sizeof(guint), &kernel_size_2));

        g_free(weights);
    }

    size = requisition->dims[0] * requisition->dims[1] * sizeof (gfloat);

    /*
     * A buffer created for a different frame size must not be reused: with a
     * larger frame the horizontal pass would write past its end.  Dropping it
     * here is enough because process() binds the buffer anew on every call.
     */
    if (priv->intermediate_mem != NULL && priv->intermediate_size != size) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseMemObject (priv->intermediate_mem));
        priv->intermediate_mem = NULL;
        priv->intermediate_size = 0;
    }

    if (priv->intermediate_mem == NULL) {
        cl_int err;

        priv->intermediate_mem = clCreateBuffer (priv->context,
                                                 CL_MEM_READ_WRITE,
                                                 size,
                                                 NULL,
                                                 &err);
        UFO_RESOURCES_CHECK_CLERR (err);
        priv->intermediate_size = (priv->intermediate_mem != NULL) ? size : 0;
    }
}

/*
 * UfoTask::get_num_inputs implementation: the task has exactly one input.
 */
static guint
ufo_blur_task_get_num_inputs (UfoTask *task)
{
    return 1;
}

/*
 * UfoTask::get_num_dimensions implementation: input 0 is two-dimensional.
 * Any other input index trips the precondition check and yields 0.
 */
static guint
ufo_blur_task_get_num_dimensions (UfoTask *task,
                                  guint input)
{
    g_return_val_if_fail (input == 0, 0);
    return 2;
}

/*
 * UfoTask::get_mode implementation: a processor task that runs on the GPU.
 */
static UfoTaskMode
ufo_blur_task_get_mode (UfoTask *task)
{
    return UFO_TASK_MODE_PROCESSOR | UFO_TASK_MODE_GPU;
}

/*
 * UfoTask::process implementation: blur inputs[0] into @output in two passes.
 *
 * h_kernel reads the input and writes the intermediate buffer; v_kernel reads
 * the intermediate buffer and writes the output.  Both are enqueued on the
 * command queue of the GPU node assigned to this task, over the 2D range
 * given by requisition->dims.
 *
 * Returns: always TRUE.
 */
static gboolean
ufo_blur_task_process (UfoTask *task,
                       UfoBuffer **inputs,
                       UfoBuffer *output,
                       UfoRequisition *requisition)
{
    UfoBlurTaskPrivate *priv;
    UfoGpuNode *node;
    cl_command_queue cmd_queue;
    cl_mem in_mem;
    cl_mem out_mem;

    priv = UFO_BLUR_TASK_GET_PRIVATE (task);
    node = UFO_GPU_NODE (ufo_task_node_get_proc_node (UFO_TASK_NODE (task)));
    cmd_queue = ufo_gpu_node_get_cmd_queue (node);

    /* First pass: input -> intermediate. */
    in_mem = ufo_buffer_get_device_array (inputs[0], cmd_queue);

    UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->h_kernel, 0, sizeof(cl_mem), &in_mem));
    UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->h_kernel, 1, sizeof(cl_mem), &priv->intermediate_mem));
    UFO_RESOURCES_CHECK_CLERR (clEnqueueNDRangeKernel (cmd_queue,
                                                       priv->h_kernel,
                                                       2, NULL, requisition->dims, NULL,
                                                       0, NULL, NULL));

    /* Second pass: intermediate -> output. */
    out_mem = ufo_buffer_get_device_array (output, cmd_queue);

    UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->v_kernel, 0, sizeof(cl_mem), &priv->intermediate_mem));
    UFO_RESOURCES_CHECK_CLERR (clSetKernelArg (priv->v_kernel, 1, sizeof(cl_mem), &out_mem));
    UFO_RESOURCES_CHECK_CLERR (clEnqueueNDRangeKernel (cmd_queue,
                                                       priv->v_kernel,
                                                       2, NULL, requisition->dims, NULL,
                                                       0, NULL, NULL));

    return TRUE;
}

/*
 * GObject::set_property implementation for "size" and "sigma".
 *
 * The values are only stored here.  The weights buffer is built once in
 * get_requisition(), so a change made after that point does not alter an
 * already created buffer.
 */
static void
ufo_blur_task_set_property (GObject *object,
                            guint property_id,
                            const GValue *value,
                            GParamSpec *pspec)
{
    UfoBlurTaskPrivate *priv = UFO_BLUR_TASK_GET_PRIVATE (object);

    switch (property_id) {
        case PROP_SIZE:
            priv->size = g_value_get_uint(value);
            break;
        case PROP_SIGMA:
            priv->sigma = g_value_get_float(value);
            break;
        default:
            G_OBJECT_WARN_INVALID_PROPERTY_ID (object, property_id, pspec);
            break;
    }
}

/*
 * GObject::get_property implementation for "size" and "sigma".
 */
static void
ufo_blur_task_get_property (GObject *object,
                            guint property_id,
                            GValue *value,
                            GParamSpec *pspec)
{
    UfoBlurTaskPrivate *priv = UFO_BLUR_TASK_GET_PRIVATE (object);

    switch (property_id) {
        case PROP_SIZE:
            g_value_set_uint(value, priv->size);
            break;
        case PROP_SIGMA:
            g_value_set_float(value, priv->sigma);
            break;
        default:
            G_OBJECT_WARN_INVALID_PROPERTY_ID (object, property_id, pspec);
            break;
    }
}

/*
 * GObject::finalize implementation: release every OpenCL handle that is set
 * (kernels, buffers, then the context) and chain up to the parent class.
 */
static void
ufo_blur_task_finalize (GObject *object)
{
    UfoBlurTaskPrivate *priv;

    priv = UFO_BLUR_TASK_GET_PRIVATE (object);

    if (priv->h_kernel) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseKernel (priv->h_kernel));
        priv->h_kernel = NULL;
    }

    if (priv->v_kernel) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseKernel (priv->v_kernel));
        priv->v_kernel = NULL;
    }

    if (priv->weights_mem) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseMemObject (priv->weights_mem));
        priv->weights_mem = NULL;
    }

    if (priv->intermediate_mem) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseMemObject (priv->intermediate_mem));
        priv->intermediate_mem = NULL;
    }

    if (priv->context) {
        UFO_RESOURCES_CHECK_CLERR (clReleaseContext (priv->context));
        priv->context = NULL;
    }

    G_OBJECT_CLASS (ufo_blur_task_parent_class)->finalize (object);
}

/*
 * Fill in the UfoTask interface vtable with the functions defined above.
 */
static void
ufo_task_interface_init (UfoTaskIface *iface)
{
    iface->setup = ufo_blur_task_setup;
    iface->get_num_inputs = ufo_blur_task_get_num_inputs;
    iface->get_num_dimensions = ufo_blur_task_get_num_dimensions;
    iface->get_mode = ufo_blur_task_get_mode;
    iface->get_requisition = ufo_blur_task_get_requisition;
    iface->process = ufo_blur_task_process;
}

/*
 * Class initialiser: hook up the GObject virtual functions, install the
 * "size" (3..1000, default 5) and "sigma" (1.0..1000.0, default 1.0)
 * properties and register the private instance structure.
 */
static void
ufo_blur_task_class_init (UfoBlurTaskClass *klass)
{
    GObjectClass *gobject_class = G_OBJECT_CLASS (klass);

    gobject_class->set_property = ufo_blur_task_set_property;
    gobject_class->get_property = ufo_blur_task_get_property;
    gobject_class->finalize = ufo_blur_task_finalize;

    properties[PROP_SIZE] =
        g_param_spec_uint("size",
                          "Size of the kernel",
                          "Size of the kernel",
                          3, 1000, 5,
                          G_PARAM_READWRITE);

    properties[PROP_SIGMA] =
        g_param_spec_float("sigma",
                           "sigma",
                           "sigma",
                           1.0f, 1000.0f, 1.0f,
                           G_PARAM_READWRITE);

    for (guint i = PROP_0 + 1; i < N_PROPERTIES; i++)
        g_object_class_install_property (gobject_class, i, properties[i]);

    g_type_class_add_private (gobject_class, sizeof(UfoBlurTaskPrivate));
}

/*
 * Instance initialiser: cache the private pointer, apply the property
 * defaults and mark both device buffers as not yet created.
 */
static void
ufo_blur_task_init(UfoBlurTask *self)
{
    self->priv = UFO_BLUR_TASK_GET_PRIVATE(self);
    self->priv->size = 5;
    self->priv->sigma = 1.0f;
    self->priv->weights_mem = NULL;
    self->priv->intermediate_mem = NULL;
    self->priv->intermediate_size = 0;
}