// // Copyright 2012 Francisco Jerez // // Permission is hereby granted, free of charge, to any person obtaining a // copy of this software and associated documentation files (the "Software"), // to deal in the Software without restriction, including without limitation // the rights to use, copy, modify, merge, publish, distribute, sublicense, // and/or sell copies of the Software, and to permit persons to whom the // Software is furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR // OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, // ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR // OTHER DEALINGS IN THE SOFTWARE. // #include "util/u_math.h" #include "api/util.hpp" #include "core/memory.hpp" #include "core/format.hpp" using namespace clover; namespace { cl_mem_flags validate_flags(cl_mem d_parent, cl_mem_flags d_flags) { const cl_mem_flags dev_access_flags = CL_MEM_READ_WRITE | CL_MEM_WRITE_ONLY | CL_MEM_READ_ONLY; const cl_mem_flags host_ptr_flags = CL_MEM_USE_HOST_PTR | CL_MEM_ALLOC_HOST_PTR | CL_MEM_COPY_HOST_PTR; const cl_mem_flags host_access_flags = CL_MEM_HOST_WRITE_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_HOST_NO_ACCESS; const cl_mem_flags valid_flags = dev_access_flags | host_access_flags | (d_parent ? 0 : host_ptr_flags); if ((d_flags & ~valid_flags) || util_bitcount(d_flags & dev_access_flags) > 1 || util_bitcount(d_flags & host_access_flags) > 1) throw error(CL_INVALID_VALUE); if ((d_flags & CL_MEM_USE_HOST_PTR) && (d_flags & (CL_MEM_COPY_HOST_PTR | CL_MEM_ALLOC_HOST_PTR))) throw error(CL_INVALID_VALUE); if (d_parent) { const auto &parent = obj(d_parent); const cl_mem_flags flags = (d_flags | (d_flags & dev_access_flags ? 0 : parent.flags() & dev_access_flags) | (d_flags & host_access_flags ? 0 : parent.flags() & host_access_flags) | (parent.flags() & host_ptr_flags)); if (~flags & parent.flags() & ((dev_access_flags & ~CL_MEM_READ_WRITE) | host_access_flags)) throw error(CL_INVALID_VALUE); return flags; } else { return d_flags | (d_flags & dev_access_flags ? 0 : CL_MEM_READ_WRITE); } } } CLOVER_API cl_mem clCreateBuffer(cl_context d_ctx, cl_mem_flags d_flags, size_t size, void *host_ptr, cl_int *r_errcode) try { const cl_mem_flags flags = validate_flags(NULL, d_flags); auto &ctx = obj(d_ctx); if (bool(host_ptr) != bool(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))) throw error(CL_INVALID_HOST_PTR); if (!size || size > fold(maximum(), cl_ulong(0), map(std::mem_fn(&device::max_mem_alloc_size), ctx.devices()) )) throw error(CL_INVALID_BUFFER_SIZE); ret_error(r_errcode, CL_SUCCESS); return new root_buffer(ctx, flags, size, host_ptr); } catch (error &e) { ret_error(r_errcode, e); return NULL; } CLOVER_API cl_mem clCreateSubBuffer(cl_mem d_mem, cl_mem_flags d_flags, cl_buffer_create_type op, const void *op_info, cl_int *r_errcode) try { auto &parent = obj(d_mem); const cl_mem_flags flags = validate_flags(d_mem, d_flags); if (op == CL_BUFFER_CREATE_TYPE_REGION) { auto reg = reinterpret_cast(op_info); if (!reg || reg->origin > parent.size() || reg->origin + reg->size > parent.size()) throw error(CL_INVALID_VALUE); if (!reg->size) throw error(CL_INVALID_BUFFER_SIZE); ret_error(r_errcode, CL_SUCCESS); return new sub_buffer(parent, flags, reg->origin, reg->size); } else { throw error(CL_INVALID_VALUE); } } catch (error &e) { ret_error(r_errcode, e); return NULL; } CLOVER_API cl_mem clCreateImage(cl_context d_ctx, cl_mem_flags d_flags, const cl_image_format *format, const cl_image_desc *desc, void *host_ptr, cl_int *r_errcode) try { auto &ctx = obj(d_ctx); if (!any_of(std::mem_fn(&device::image_support), ctx.devices())) throw error(CL_INVALID_OPERATION); if (!format) throw error(CL_INVALID_IMAGE_FORMAT_DESCRIPTOR); if (!desc) throw error(CL_INVALID_IMAGE_DESCRIPTOR); if (desc->image_array_size == 0 && (desc->image_type == CL_MEM_OBJECT_IMAGE1D_ARRAY || desc->image_type == CL_MEM_OBJECT_IMAGE2D_ARRAY)) throw error(CL_INVALID_IMAGE_DESCRIPTOR); if (!host_ptr && (desc->image_row_pitch || desc->image_slice_pitch)) throw error(CL_INVALID_IMAGE_DESCRIPTOR); if (desc->num_mip_levels || desc->num_samples) throw error(CL_INVALID_IMAGE_DESCRIPTOR); if (bool(desc->buffer) != (desc->image_type == CL_MEM_OBJECT_IMAGE1D_BUFFER)) throw error(CL_INVALID_IMAGE_DESCRIPTOR); if (bool(host_ptr) != bool(d_flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))) throw error(CL_INVALID_HOST_PTR); const cl_mem_flags flags = validate_flags(desc->buffer, d_flags); if (!supported_formats(ctx, desc->image_type).count(*format)) throw error(CL_IMAGE_FORMAT_NOT_SUPPORTED); ret_error(r_errcode, CL_SUCCESS); switch (desc->image_type) { case CL_MEM_OBJECT_IMAGE2D: if (!desc->image_width || !desc->image_height) throw error(CL_INVALID_IMAGE_SIZE); if (all_of([=](const device &dev) { const size_t max = 1 << dev.max_image_levels_2d(); return (desc->image_width > max || desc->image_height > max); }, ctx.devices())) throw error(CL_INVALID_IMAGE_SIZE); return new image2d(ctx, flags, format, desc->image_width, desc->image_height, desc->image_row_pitch, host_ptr); case CL_MEM_OBJECT_IMAGE3D: if (!desc->image_width || !desc->image_height || !desc->image_depth) throw error(CL_INVALID_IMAGE_SIZE); if (all_of([=](const device &dev) { const size_t max = 1 << dev.max_image_levels_3d(); return (desc->image_width > max || desc->image_height > max || desc->image_depth > max); }, ctx.devices())) throw error(CL_INVALID_IMAGE_SIZE); return new image3d(ctx, flags, format, desc->image_width, desc->image_height, desc->image_depth, desc->image_row_pitch, desc->image_slice_pitch, host_ptr); case CL_MEM_OBJECT_IMAGE1D: case CL_MEM_OBJECT_IMAGE1D_ARRAY: case CL_MEM_OBJECT_IMAGE1D_BUFFER: case CL_MEM_OBJECT_IMAGE2D_ARRAY: // XXX - Not implemented. throw error(CL_IMAGE_FORMAT_NOT_SUPPORTED); default: throw error(CL_INVALID_IMAGE_DESCRIPTOR); } } catch (error &e) { ret_error(r_errcode, e); return NULL; } CLOVER_API cl_mem clCreateImage2D(cl_context d_ctx, cl_mem_flags d_flags, const cl_image_format *format, size_t width, size_t height, size_t row_pitch, void *host_ptr, cl_int *r_errcode) { const cl_image_desc desc = { CL_MEM_OBJECT_IMAGE2D, width, height, 0, 0, row_pitch, 0, 0, 0, NULL }; return clCreateImage(d_ctx, d_flags, format, &desc, host_ptr, r_errcode); } CLOVER_API cl_mem clCreateImage3D(cl_context d_ctx, cl_mem_flags d_flags, const cl_image_format *format, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, void *host_ptr, cl_int *r_errcode) { const cl_image_desc desc = { CL_MEM_OBJECT_IMAGE3D, width, height, depth, 0, row_pitch, slice_pitch, 0, 0, NULL }; return clCreateImage(d_ctx, d_flags, format, &desc, host_ptr, r_errcode); } CLOVER_API cl_int clGetSupportedImageFormats(cl_context d_ctx, cl_mem_flags flags, cl_mem_object_type type, cl_uint count, cl_image_format *r_buf, cl_uint *r_count) try { auto &ctx = obj(d_ctx); auto formats = supported_formats(ctx, type); validate_flags(NULL, flags); if (r_buf && !r_count) throw error(CL_INVALID_VALUE); if (r_buf) std::copy_n(formats.begin(), std::min((cl_uint)formats.size(), count), r_buf); if (r_count) *r_count = formats.size(); return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clGetMemObjectInfo(cl_mem d_mem, cl_mem_info param, size_t size, void *r_buf, size_t *r_size) try { property_buffer buf { r_buf, size, r_size }; auto &mem = obj(d_mem); switch (param) { case CL_MEM_TYPE: buf.as_scalar() = mem.type(); break; case CL_MEM_FLAGS: buf.as_scalar() = mem.flags(); break; case CL_MEM_SIZE: buf.as_scalar() = mem.size(); break; case CL_MEM_HOST_PTR: buf.as_scalar() = mem.host_ptr(); break; case CL_MEM_MAP_COUNT: buf.as_scalar() = 0; break; case CL_MEM_REFERENCE_COUNT: buf.as_scalar() = mem.ref_count(); break; case CL_MEM_CONTEXT: buf.as_scalar() = desc(mem.context()); break; case CL_MEM_ASSOCIATED_MEMOBJECT: { sub_buffer *sub = dynamic_cast(&mem); buf.as_scalar() = (sub ? desc(sub->parent()) : NULL); break; } case CL_MEM_OFFSET: { sub_buffer *sub = dynamic_cast(&mem); buf.as_scalar() = (sub ? sub->offset() : 0); break; } default: throw error(CL_INVALID_VALUE); } return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clGetImageInfo(cl_mem d_mem, cl_image_info param, size_t size, void *r_buf, size_t *r_size) try { property_buffer buf { r_buf, size, r_size }; auto &img = obj(d_mem); switch (param) { case CL_IMAGE_FORMAT: buf.as_scalar() = img.format(); break; case CL_IMAGE_ELEMENT_SIZE: buf.as_scalar() = 0; break; case CL_IMAGE_ROW_PITCH: buf.as_scalar() = img.row_pitch(); break; case CL_IMAGE_SLICE_PITCH: buf.as_scalar() = img.slice_pitch(); break; case CL_IMAGE_WIDTH: buf.as_scalar() = img.width(); break; case CL_IMAGE_HEIGHT: buf.as_scalar() = img.height(); break; case CL_IMAGE_DEPTH: buf.as_scalar() = img.depth(); break; default: throw error(CL_INVALID_VALUE); } return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clRetainMemObject(cl_mem d_mem) try { obj(d_mem).retain(); return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clReleaseMemObject(cl_mem d_mem) try { if (obj(d_mem).release()) delete pobj(d_mem); return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clSetMemObjectDestructorCallback(cl_mem d_mem, void (CL_CALLBACK *pfn_notify)(cl_mem, void *), void *user_data) try { auto &mem = obj(d_mem); if (!pfn_notify) return CL_INVALID_VALUE; mem.destroy_notify([=]{ pfn_notify(d_mem, user_data); }); return CL_SUCCESS; } catch (error &e) { return e.get(); } CLOVER_API cl_int clEnqueueFillBuffer(cl_command_queue command_queue, cl_mem buffer, const void *pattern, size_t pattern_size, size_t offset, size_t size, cl_uint num_events_in_wait_list, const cl_event *event_wait_list, cl_event *event) { CLOVER_NOT_SUPPORTED_UNTIL("1.2"); return CL_INVALID_VALUE; } CLOVER_API cl_int clEnqueueFillImage(cl_command_queue command_queue, cl_mem image, const void *fill_color, const size_t *origin, const size_t *region, cl_uint num_events_in_wait_list, const cl_event *event_wait_list, cl_event *event) { CLOVER_NOT_SUPPORTED_UNTIL("1.2"); return CL_INVALID_VALUE; }