123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614 |
- /*
- * Copyright (c) 2017, Mellanox Technologies inc. All rights reserved.
- *
- * This software is available to you under a choice of one of two
- * licenses. You may choose to be licensed under the terms of the GNU
- * General Public License (GPL) Version 2, available from the file
- * COPYING in the main directory of this source tree, or the
- * OpenIB.org BSD license below:
- *
- * Redistribution and use in source and binary forms, with or
- * without modification, are permitted provided that the following
- * conditions are met:
- *
- * - Redistributions of source code must retain the above
- * copyright notice, this list of conditions and the following
- * disclaimer.
- *
- * - Redistributions in binary form must reproduce the above
- * copyright notice, this list of conditions and the following
- * disclaimer in the documentation and/or other materials
- * provided with the distribution.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
- * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
- * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
- * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
- #include <rdma/rdma_user_ioctl.h>
- #include <rdma/uverbs_ioctl.h>
- #include "rdma_core.h"
- #include "uverbs.h"
- struct bundle_alloc_head {
- struct bundle_alloc_head *next;
- u8 data[];
- };
- struct bundle_priv {
- /* Must be first */
- struct bundle_alloc_head alloc_head;
- struct bundle_alloc_head *allocated_mem;
- size_t internal_avail;
- size_t internal_used;
- struct radix_tree_root *radix;
- const struct uverbs_api_ioctl_method *method_elm;
- void __rcu **radix_slots;
- unsigned long radix_slots_len;
- u32 method_key;
- struct ib_uverbs_attr __user *user_attrs;
- struct ib_uverbs_attr *uattrs;
- DECLARE_BITMAP(uobj_finalize, UVERBS_API_ATTR_BKEY_LEN);
- /*
- * Must be last. bundle ends in a flex array which overlaps
- * internal_buffer.
- */
- struct uverbs_attr_bundle bundle;
- u64 internal_buffer[32];
- };
- /*
- * Each method has an absolute minimum amount of memory it needs to allocate,
- * precompute that amount and determine if the onstack memory can be used or
- * if allocation is need.
- */
- void uapi_compute_bundle_size(struct uverbs_api_ioctl_method *method_elm,
- unsigned int num_attrs)
- {
- struct bundle_priv *pbundle;
- size_t bundle_size =
- offsetof(struct bundle_priv, internal_buffer) +
- sizeof(*pbundle->bundle.attrs) * method_elm->key_bitmap_len +
- sizeof(*pbundle->uattrs) * num_attrs;
- method_elm->use_stack = bundle_size <= sizeof(*pbundle);
- method_elm->bundle_size =
- ALIGN(bundle_size + 256, sizeof(*pbundle->internal_buffer));
- /* Do not want order-2 allocations for this. */
- WARN_ON_ONCE(method_elm->bundle_size > PAGE_SIZE);
- }
- /**
- * uverbs_alloc() - Quickly allocate memory for use with a bundle
- * @bundle: The bundle
- * @size: Number of bytes to allocate
- * @flags: Allocator flags
- *
- * The bundle allocator is intended for allocations that are connected with
- * processing the system call related to the bundle. The allocated memory is
- * always freed once the system call completes, and cannot be freed any other
- * way.
- *
- * This tries to use a small pool of pre-allocated memory for performance.
- */
- __malloc void *_uverbs_alloc(struct uverbs_attr_bundle *bundle, size_t size,
- gfp_t flags)
- {
- struct bundle_priv *pbundle =
- container_of(bundle, struct bundle_priv, bundle);
- size_t new_used;
- void *res;
- if (check_add_overflow(size, pbundle->internal_used, &new_used))
- return ERR_PTR(-EOVERFLOW);
- if (new_used > pbundle->internal_avail) {
- struct bundle_alloc_head *buf;
- buf = kvmalloc(struct_size(buf, data, size), flags);
- if (!buf)
- return ERR_PTR(-ENOMEM);
- buf->next = pbundle->allocated_mem;
- pbundle->allocated_mem = buf;
- return buf->data;
- }
- res = (void *)pbundle->internal_buffer + pbundle->internal_used;
- pbundle->internal_used =
- ALIGN(new_used, sizeof(*pbundle->internal_buffer));
- if (flags & __GFP_ZERO)
- memset(res, 0, size);
- return res;
- }
- EXPORT_SYMBOL(_uverbs_alloc);
- static bool uverbs_is_attr_cleared(const struct ib_uverbs_attr *uattr,
- u16 len)
- {
- if (uattr->len > sizeof(((struct ib_uverbs_attr *)0)->data))
- return ib_is_buffer_cleared(u64_to_user_ptr(uattr->data) + len,
- uattr->len - len);
- return !memchr_inv((const void *)&uattr->data + len,
- 0, uattr->len - len);
- }
- static int uverbs_process_attr(struct bundle_priv *pbundle,
- const struct uverbs_api_attr *attr_uapi,
- struct ib_uverbs_attr *uattr, u32 attr_bkey)
- {
- const struct uverbs_attr_spec *spec = &attr_uapi->spec;
- struct uverbs_attr *e = &pbundle->bundle.attrs[attr_bkey];
- const struct uverbs_attr_spec *val_spec = spec;
- struct uverbs_obj_attr *o_attr;
- switch (spec->type) {
- case UVERBS_ATTR_TYPE_ENUM_IN:
- if (uattr->attr_data.enum_data.elem_id >= spec->u.enum_def.num_elems)
- return -EOPNOTSUPP;
- if (uattr->attr_data.enum_data.reserved)
- return -EINVAL;
- val_spec = &spec->u2.enum_def.ids[uattr->attr_data.enum_data.elem_id];
- /* Currently we only support PTR_IN based enums */
- if (val_spec->type != UVERBS_ATTR_TYPE_PTR_IN)
- return -EOPNOTSUPP;
- e->ptr_attr.enum_id = uattr->attr_data.enum_data.elem_id;
- /* fall through */
- case UVERBS_ATTR_TYPE_PTR_IN:
- /* Ensure that any data provided by userspace beyond the known
- * struct is zero. Userspace that knows how to use some future
- * longer struct will fail here if used with an old kernel and
- * non-zero content, making ABI compat/discovery simpler.
- */
- if (uattr->len > val_spec->u.ptr.len &&
- val_spec->zero_trailing &&
- !uverbs_is_attr_cleared(uattr, val_spec->u.ptr.len))
- return -EOPNOTSUPP;
- /* fall through */
- case UVERBS_ATTR_TYPE_PTR_OUT:
- if (uattr->len < val_spec->u.ptr.min_len ||
- (!val_spec->zero_trailing &&
- uattr->len > val_spec->u.ptr.len))
- return -EINVAL;
- if (spec->type != UVERBS_ATTR_TYPE_ENUM_IN &&
- uattr->attr_data.reserved)
- return -EINVAL;
- e->ptr_attr.uattr_idx = uattr - pbundle->uattrs;
- e->ptr_attr.len = uattr->len;
- if (val_spec->alloc_and_copy && !uverbs_attr_ptr_is_inline(e)) {
- void *p;
- p = uverbs_alloc(&pbundle->bundle, uattr->len);
- if (IS_ERR(p))
- return PTR_ERR(p);
- e->ptr_attr.ptr = p;
- if (copy_from_user(p, u64_to_user_ptr(uattr->data),
- uattr->len))
- return -EFAULT;
- } else {
- e->ptr_attr.data = uattr->data;
- }
- break;
- case UVERBS_ATTR_TYPE_IDR:
- case UVERBS_ATTR_TYPE_FD:
- if (uattr->attr_data.reserved)
- return -EINVAL;
- if (uattr->len != 0)
- return -EINVAL;
- o_attr = &e->obj_attr;
- o_attr->attr_elm = attr_uapi;
- /*
- * The type of uattr->data is u64 for UVERBS_ATTR_TYPE_IDR and
- * s64 for UVERBS_ATTR_TYPE_FD. We can cast the u64 to s64
- * here without caring about truncation as we know that the
- * IDR implementation today rejects negative IDs
- */
- o_attr->uobject = uverbs_get_uobject_from_file(
- spec->u.obj.obj_type,
- pbundle->bundle.ufile,
- spec->u.obj.access,
- uattr->data_s64);
- if (IS_ERR(o_attr->uobject))
- return PTR_ERR(o_attr->uobject);
- __set_bit(attr_bkey, pbundle->uobj_finalize);
- if (spec->u.obj.access == UVERBS_ACCESS_NEW) {
- unsigned int uattr_idx = uattr - pbundle->uattrs;
- s64 id = o_attr->uobject->id;
- /* Copy the allocated id to the user-space */
- if (put_user(id, &pbundle->user_attrs[uattr_idx].data))
- return -EFAULT;
- }
- break;
- default:
- return -EOPNOTSUPP;
- }
- return 0;
- }
- /*
- * We search the radix tree with the method prefix and now we want to fast
- * search the suffix bits to get a particular attribute pointer. It is not
- * totally clear to me if this breaks the radix tree encasulation or not, but
- * it uses the iter data to determine if the method iter points at the same
- * chunk that will store the attribute, if so it just derefs it directly. By
- * construction in most kernel configs the method and attrs will all fit in a
- * single radix chunk, so in most cases this will have no search. Other cases
- * this falls back to a full search.
- */
- static void __rcu **uapi_get_attr_for_method(struct bundle_priv *pbundle,
- u32 attr_key)
- {
- void __rcu **slot;
- if (likely(attr_key < pbundle->radix_slots_len)) {
- void *entry;
- slot = pbundle->radix_slots + attr_key;
- entry = rcu_dereference_raw(*slot);
- if (likely(!radix_tree_is_internal_node(entry) && entry))
- return slot;
- }
- return radix_tree_lookup_slot(pbundle->radix,
- pbundle->method_key | attr_key);
- }
- static int uverbs_set_attr(struct bundle_priv *pbundle,
- struct ib_uverbs_attr *uattr)
- {
- u32 attr_key = uapi_key_attr(uattr->attr_id);
- u32 attr_bkey = uapi_bkey_attr(attr_key);
- const struct uverbs_api_attr *attr;
- void __rcu **slot;
- int ret;
- slot = uapi_get_attr_for_method(pbundle, attr_key);
- if (!slot) {
- /*
- * Kernel does not support the attribute but user-space says it
- * is mandatory
- */
- if (uattr->flags & UVERBS_ATTR_F_MANDATORY)
- return -EPROTONOSUPPORT;
- return 0;
- }
- attr = srcu_dereference(
- *slot, &pbundle->bundle.ufile->device->disassociate_srcu);
- /* Reject duplicate attributes from user-space */
- if (test_bit(attr_bkey, pbundle->bundle.attr_present))
- return -EINVAL;
- ret = uverbs_process_attr(pbundle, attr, uattr, attr_bkey);
- if (ret)
- return ret;
- __set_bit(attr_bkey, pbundle->bundle.attr_present);
- return 0;
- }
- static int ib_uverbs_run_method(struct bundle_priv *pbundle,
- unsigned int num_attrs)
- {
- int (*handler)(struct ib_uverbs_file *ufile,
- struct uverbs_attr_bundle *ctx);
- size_t uattrs_size = array_size(sizeof(*pbundle->uattrs), num_attrs);
- unsigned int destroy_bkey = pbundle->method_elm->destroy_bkey;
- unsigned int i;
- int ret;
- /* See uverbs_disassociate_api() */
- handler = srcu_dereference(
- pbundle->method_elm->handler,
- &pbundle->bundle.ufile->device->disassociate_srcu);
- if (!handler)
- return -EIO;
- pbundle->uattrs = uverbs_alloc(&pbundle->bundle, uattrs_size);
- if (IS_ERR(pbundle->uattrs))
- return PTR_ERR(pbundle->uattrs);
- if (copy_from_user(pbundle->uattrs, pbundle->user_attrs, uattrs_size))
- return -EFAULT;
- for (i = 0; i != num_attrs; i++) {
- ret = uverbs_set_attr(pbundle, &pbundle->uattrs[i]);
- if (unlikely(ret))
- return ret;
- }
- /* User space did not provide all the mandatory attributes */
- if (unlikely(!bitmap_subset(pbundle->method_elm->attr_mandatory,
- pbundle->bundle.attr_present,
- pbundle->method_elm->key_bitmap_len)))
- return -EINVAL;
- if (destroy_bkey != UVERBS_API_ATTR_BKEY_LEN) {
- struct uverbs_obj_attr *destroy_attr =
- &pbundle->bundle.attrs[destroy_bkey].obj_attr;
- ret = uobj_destroy(destroy_attr->uobject);
- if (ret)
- return ret;
- __clear_bit(destroy_bkey, pbundle->uobj_finalize);
- ret = handler(pbundle->bundle.ufile, &pbundle->bundle);
- uobj_put_destroy(destroy_attr->uobject);
- } else {
- ret = handler(pbundle->bundle.ufile, &pbundle->bundle);
- }
- /*
- * EPROTONOSUPPORT is ONLY to be returned if the ioctl framework can
- * not invoke the method because the request is not supported. No
- * other cases should return this code.
- */
- if (WARN_ON_ONCE(ret == -EPROTONOSUPPORT))
- return -EINVAL;
- return ret;
- }
- static int bundle_destroy(struct bundle_priv *pbundle, bool commit)
- {
- unsigned int key_bitmap_len = pbundle->method_elm->key_bitmap_len;
- struct bundle_alloc_head *memblock;
- unsigned int i;
- int ret = 0;
- i = -1;
- while ((i = find_next_bit(pbundle->uobj_finalize, key_bitmap_len,
- i + 1)) < key_bitmap_len) {
- struct uverbs_attr *attr = &pbundle->bundle.attrs[i];
- int current_ret;
- current_ret = uverbs_finalize_object(
- attr->obj_attr.uobject,
- attr->obj_attr.attr_elm->spec.u.obj.access, commit);
- if (!ret)
- ret = current_ret;
- }
- for (memblock = pbundle->allocated_mem; memblock;) {
- struct bundle_alloc_head *tmp = memblock;
- memblock = memblock->next;
- kvfree(tmp);
- }
- return ret;
- }
- static int ib_uverbs_cmd_verbs(struct ib_uverbs_file *ufile,
- struct ib_uverbs_ioctl_hdr *hdr,
- struct ib_uverbs_attr __user *user_attrs)
- {
- const struct uverbs_api_ioctl_method *method_elm;
- struct uverbs_api *uapi = ufile->device->uapi;
- struct radix_tree_iter attrs_iter;
- struct bundle_priv *pbundle;
- struct bundle_priv onstack;
- void __rcu **slot;
- int destroy_ret;
- int ret;
- if (unlikely(hdr->driver_id != uapi->driver_id))
- return -EINVAL;
- slot = radix_tree_iter_lookup(
- &uapi->radix, &attrs_iter,
- uapi_key_obj(hdr->object_id) |
- uapi_key_ioctl_method(hdr->method_id));
- if (unlikely(!slot))
- return -EPROTONOSUPPORT;
- method_elm = srcu_dereference(*slot, &ufile->device->disassociate_srcu);
- if (!method_elm->use_stack) {
- pbundle = kmalloc(method_elm->bundle_size, GFP_KERNEL);
- if (!pbundle)
- return -ENOMEM;
- pbundle->internal_avail =
- method_elm->bundle_size -
- offsetof(struct bundle_priv, internal_buffer);
- pbundle->alloc_head.next = NULL;
- pbundle->allocated_mem = &pbundle->alloc_head;
- } else {
- pbundle = &onstack;
- pbundle->internal_avail = sizeof(pbundle->internal_buffer);
- pbundle->allocated_mem = NULL;
- }
- /* Space for the pbundle->bundle.attrs flex array */
- pbundle->method_elm = method_elm;
- pbundle->method_key = attrs_iter.index;
- pbundle->bundle.ufile = ufile;
- pbundle->radix = &uapi->radix;
- pbundle->radix_slots = slot;
- pbundle->radix_slots_len = radix_tree_chunk_size(&attrs_iter);
- pbundle->user_attrs = user_attrs;
- pbundle->internal_used = ALIGN(pbundle->method_elm->key_bitmap_len *
- sizeof(*pbundle->bundle.attrs),
- sizeof(*pbundle->internal_buffer));
- memset(pbundle->bundle.attr_present, 0,
- sizeof(pbundle->bundle.attr_present));
- memset(pbundle->uobj_finalize, 0, sizeof(pbundle->uobj_finalize));
- ret = ib_uverbs_run_method(pbundle, hdr->num_attrs);
- destroy_ret = bundle_destroy(pbundle, ret == 0);
- if (unlikely(destroy_ret && !ret))
- return destroy_ret;
- return ret;
- }
- long ib_uverbs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
- {
- struct ib_uverbs_file *file = filp->private_data;
- struct ib_uverbs_ioctl_hdr __user *user_hdr =
- (struct ib_uverbs_ioctl_hdr __user *)arg;
- struct ib_uverbs_ioctl_hdr hdr;
- int srcu_key;
- int err;
- if (unlikely(cmd != RDMA_VERBS_IOCTL))
- return -ENOIOCTLCMD;
- err = copy_from_user(&hdr, user_hdr, sizeof(hdr));
- if (err)
- return -EFAULT;
- if (hdr.length > PAGE_SIZE ||
- hdr.length != struct_size(&hdr, attrs, hdr.num_attrs))
- return -EINVAL;
- if (hdr.reserved1 || hdr.reserved2)
- return -EPROTONOSUPPORT;
- srcu_key = srcu_read_lock(&file->device->disassociate_srcu);
- err = ib_uverbs_cmd_verbs(file, &hdr, user_hdr->attrs);
- srcu_read_unlock(&file->device->disassociate_srcu, srcu_key);
- return err;
- }
- int uverbs_get_flags64(u64 *to, const struct uverbs_attr_bundle *attrs_bundle,
- size_t idx, u64 allowed_bits)
- {
- const struct uverbs_attr *attr;
- u64 flags;
- attr = uverbs_attr_get(attrs_bundle, idx);
- /* Missing attribute means 0 flags */
- if (IS_ERR(attr)) {
- *to = 0;
- return 0;
- }
- /*
- * New userspace code should use 8 bytes to pass flags, but we
- * transparently support old userspaces that were using 4 bytes as
- * well.
- */
- if (attr->ptr_attr.len == 8)
- flags = attr->ptr_attr.data;
- else if (attr->ptr_attr.len == 4)
- flags = *(u32 *)&attr->ptr_attr.data;
- else
- return -EINVAL;
- if (flags & ~allowed_bits)
- return -EINVAL;
- *to = flags;
- return 0;
- }
- EXPORT_SYMBOL(uverbs_get_flags64);
- int uverbs_get_flags32(u32 *to, const struct uverbs_attr_bundle *attrs_bundle,
- size_t idx, u64 allowed_bits)
- {
- u64 flags;
- int ret;
- ret = uverbs_get_flags64(&flags, attrs_bundle, idx, allowed_bits);
- if (ret)
- return ret;
- if (flags > U32_MAX)
- return -EINVAL;
- *to = flags;
- return 0;
- }
- EXPORT_SYMBOL(uverbs_get_flags32);
- /*
- * This is for ease of conversion. The purpose is to convert all drivers to
- * use uverbs_attr_bundle instead of ib_udata. Assume attr == 0 is input and
- * attr == 1 is output.
- */
- void create_udata(struct uverbs_attr_bundle *bundle, struct ib_udata *udata)
- {
- struct bundle_priv *pbundle =
- container_of(bundle, struct bundle_priv, bundle);
- const struct uverbs_attr *uhw_in =
- uverbs_attr_get(bundle, UVERBS_ATTR_UHW_IN);
- const struct uverbs_attr *uhw_out =
- uverbs_attr_get(bundle, UVERBS_ATTR_UHW_OUT);
- if (!IS_ERR(uhw_in)) {
- udata->inlen = uhw_in->ptr_attr.len;
- if (uverbs_attr_ptr_is_inline(uhw_in))
- udata->inbuf =
- &pbundle->user_attrs[uhw_in->ptr_attr.uattr_idx]
- .data;
- else
- udata->inbuf = u64_to_user_ptr(uhw_in->ptr_attr.data);
- } else {
- udata->inbuf = NULL;
- udata->inlen = 0;
- }
- if (!IS_ERR(uhw_out)) {
- udata->outbuf = u64_to_user_ptr(uhw_out->ptr_attr.data);
- udata->outlen = uhw_out->ptr_attr.len;
- } else {
- udata->outbuf = NULL;
- udata->outlen = 0;
- }
- }
- int uverbs_copy_to(const struct uverbs_attr_bundle *bundle, size_t idx,
- const void *from, size_t size)
- {
- struct bundle_priv *pbundle =
- container_of(bundle, struct bundle_priv, bundle);
- const struct uverbs_attr *attr = uverbs_attr_get(bundle, idx);
- u16 flags;
- size_t min_size;
- if (IS_ERR(attr))
- return PTR_ERR(attr);
- min_size = min_t(size_t, attr->ptr_attr.len, size);
- if (copy_to_user(u64_to_user_ptr(attr->ptr_attr.data), from, min_size))
- return -EFAULT;
- flags = pbundle->uattrs[attr->ptr_attr.uattr_idx].flags |
- UVERBS_ATTR_F_VALID_OUTPUT;
- if (put_user(flags,
- &pbundle->user_attrs[attr->ptr_attr.uattr_idx].flags))
- return -EFAULT;
- return 0;
- }
- EXPORT_SYMBOL(uverbs_copy_to);
|