linux/drivers/misc/vmw_vmci/vmci_context.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0-only
   2/*
   3 * VMware VMCI Driver
   4 *
   5 * Copyright (C) 2012 VMware, Inc. All rights reserved.
   6 */
   7
   8#include <linux/vmw_vmci_defs.h>
   9#include <linux/vmw_vmci_api.h>
  10#include <linux/highmem.h>
  11#include <linux/kernel.h>
  12#include <linux/module.h>
  13#include <linux/sched.h>
  14#include <linux/cred.h>
  15#include <linux/slab.h>
  16
  17#include "vmci_queue_pair.h"
  18#include "vmci_datagram.h"
  19#include "vmci_doorbell.h"
  20#include "vmci_context.h"
  21#include "vmci_driver.h"
  22#include "vmci_event.h"
  23
  24/* Use a wide upper bound for the maximum contexts. */
  25#define VMCI_MAX_CONTEXTS 2000
  26
  27/*
  28 * List of current VMCI contexts.  Contexts can be added by
  29 * vmci_ctx_create() and removed via vmci_ctx_destroy().
  30 * These, along with context lookup, are protected by the
  31 * list structure's lock.
  32 */
  33static struct {
  34        struct list_head head;
  35        spinlock_t lock; /* Spinlock for context list operations */
  36} ctx_list = {
  37        .head = LIST_HEAD_INIT(ctx_list.head),
  38        .lock = __SPIN_LOCK_UNLOCKED(ctx_list.lock),
  39};
  40
  41/* Used by contexts that did not set up notify flag pointers */
  42static bool ctx_dummy_notify;
  43
  44static void ctx_signal_notify(struct vmci_ctx *context)
  45{
  46        *context->notify = true;
  47}
  48
  49static void ctx_clear_notify(struct vmci_ctx *context)
  50{
  51        *context->notify = false;
  52}
  53
  54/*
  55 * If nothing requires the attention of the guest, clears both
  56 * notify flag and call.
  57 */
  58static void ctx_clear_notify_call(struct vmci_ctx *context)
  59{
  60        if (context->pending_datagrams == 0 &&
  61            vmci_handle_arr_get_size(context->pending_doorbell_array) == 0)
  62                ctx_clear_notify(context);
  63}
  64
  65/*
  66 * Sets the context's notify flag iff datagrams are pending for this
  67 * context.  Called from vmci_setup_notify().
  68 */
  69void vmci_ctx_check_signal_notify(struct vmci_ctx *context)
  70{
  71        spin_lock(&context->lock);
  72        if (context->pending_datagrams)
  73                ctx_signal_notify(context);
  74        spin_unlock(&context->lock);
  75}
  76
  77/*
  78 * Allocates and initializes a VMCI context.
  79 */
  80struct vmci_ctx *vmci_ctx_create(u32 cid, u32 priv_flags,
  81                                 uintptr_t event_hnd,
  82                                 int user_version,
  83                                 const struct cred *cred)
  84{
  85        struct vmci_ctx *context;
  86        int error;
  87
  88        if (cid == VMCI_INVALID_ID) {
  89                pr_devel("Invalid context ID for VMCI context\n");
  90                error = -EINVAL;
  91                goto err_out;
  92        }
  93
  94        if (priv_flags & ~VMCI_PRIVILEGE_ALL_FLAGS) {
  95                pr_devel("Invalid flag (flags=0x%x) for VMCI context\n",
  96                         priv_flags);
  97                error = -EINVAL;
  98                goto err_out;
  99        }
 100
 101        if (user_version == 0) {
 102                pr_devel("Invalid suer_version %d\n", user_version);
 103                error = -EINVAL;
 104                goto err_out;
 105        }
 106
 107        context = kzalloc(sizeof(*context), GFP_KERNEL);
 108        if (!context) {
 109                pr_warn("Failed to allocate memory for VMCI context\n");
 110                error = -EINVAL;
 111                goto err_out;
 112        }
 113
 114        kref_init(&context->kref);
 115        spin_lock_init(&context->lock);
 116        INIT_LIST_HEAD(&context->list_item);
 117        INIT_LIST_HEAD(&context->datagram_queue);
 118        INIT_LIST_HEAD(&context->notifier_list);
 119
 120        /* Initialize host-specific VMCI context. */
 121        init_waitqueue_head(&context->host_context.wait_queue);
 122
 123        context->queue_pair_array =
 124                vmci_handle_arr_create(0, VMCI_MAX_GUEST_QP_COUNT);
 125        if (!context->queue_pair_array) {
 126                error = -ENOMEM;
 127                goto err_free_ctx;
 128        }
 129
 130        context->doorbell_array =
 131                vmci_handle_arr_create(0, VMCI_MAX_GUEST_DOORBELL_COUNT);
 132        if (!context->doorbell_array) {
 133                error = -ENOMEM;
 134                goto err_free_qp_array;
 135        }
 136
 137        context->pending_doorbell_array =
 138                vmci_handle_arr_create(0, VMCI_MAX_GUEST_DOORBELL_COUNT);
 139        if (!context->pending_doorbell_array) {
 140                error = -ENOMEM;
 141                goto err_free_db_array;
 142        }
 143
 144        context->user_version = user_version;
 145
 146        context->priv_flags = priv_flags;
 147
 148        if (cred)
 149                context->cred = get_cred(cred);
 150
 151        context->notify = &ctx_dummy_notify;
 152        context->notify_page = NULL;
 153
 154        /*
 155         * If we collide with an existing context we generate a new
 156         * and use it instead. The VMX will determine if regeneration
 157         * is okay. Since there isn't 4B - 16 VMs running on a given
 158         * host, the below loop will terminate.
 159         */
 160        spin_lock(&ctx_list.lock);
 161
 162        while (vmci_ctx_exists(cid)) {
 163                /* We reserve the lowest 16 ids for fixed contexts. */
 164                cid = max(cid, VMCI_RESERVED_CID_LIMIT - 1) + 1;
 165                if (cid == VMCI_INVALID_ID)
 166                        cid = VMCI_RESERVED_CID_LIMIT;
 167        }
 168        context->cid = cid;
 169
 170        list_add_tail_rcu(&context->list_item, &ctx_list.head);
 171        spin_unlock(&ctx_list.lock);
 172
 173        return context;
 174
 175 err_free_db_array:
 176        vmci_handle_arr_destroy(context->doorbell_array);
 177 err_free_qp_array:
 178        vmci_handle_arr_destroy(context->queue_pair_array);
 179 err_free_ctx:
 180        kfree(context);
 181 err_out:
 182        return ERR_PTR(error);
 183}
 184
 185/*
 186 * Destroy VMCI context.
 187 */
 188void vmci_ctx_destroy(struct vmci_ctx *context)
 189{
 190        spin_lock(&ctx_list.lock);
 191        list_del_rcu(&context->list_item);
 192        spin_unlock(&ctx_list.lock);
 193        synchronize_rcu();
 194
 195        vmci_ctx_put(context);
 196}
 197
 198/*
 199 * Fire notification for all contexts interested in given cid.
 200 */
 201static int ctx_fire_notification(u32 context_id, u32 priv_flags)
 202{
 203        u32 i, array_size;
 204        struct vmci_ctx *sub_ctx;
 205        struct vmci_handle_arr *subscriber_array;
 206        struct vmci_handle context_handle =
 207                vmci_make_handle(context_id, VMCI_EVENT_HANDLER);
 208
 209        /*
 210         * We create an array to hold the subscribers we find when
 211         * scanning through all contexts.
 212         */
 213        subscriber_array = vmci_handle_arr_create(0, VMCI_MAX_CONTEXTS);
 214        if (subscriber_array == NULL)
 215                return VMCI_ERROR_NO_MEM;
 216
 217        /*
 218         * Scan all contexts to find who is interested in being
 219         * notified about given contextID.
 220         */
 221        rcu_read_lock();
 222        list_for_each_entry_rcu(sub_ctx, &ctx_list.head, list_item) {
 223                struct vmci_handle_list *node;
 224
 225                /*
 226                 * We only deliver notifications of the removal of
 227                 * contexts, if the two contexts are allowed to
 228                 * interact.
 229                 */
 230                if (vmci_deny_interaction(priv_flags, sub_ctx->priv_flags))
 231                        continue;
 232
 233                list_for_each_entry_rcu(node, &sub_ctx->notifier_list, node) {
 234                        if (!vmci_handle_is_equal(node->handle, context_handle))
 235                                continue;
 236
 237                        vmci_handle_arr_append_entry(&subscriber_array,
 238                                        vmci_make_handle(sub_ctx->cid,
 239                                                         VMCI_EVENT_HANDLER));
 240                }
 241        }
 242        rcu_read_unlock();
 243
 244        /* Fire event to all subscribers. */
 245        array_size = vmci_handle_arr_get_size(subscriber_array);
 246        for (i = 0; i < array_size; i++) {
 247                int result;
 248                struct vmci_event_ctx ev;
 249
 250                ev.msg.hdr.dst = vmci_handle_arr_get_entry(subscriber_array, i);
 251                ev.msg.hdr.src = vmci_make_handle(VMCI_HYPERVISOR_CONTEXT_ID,
 252                                                  VMCI_CONTEXT_RESOURCE_ID);
 253                ev.msg.hdr.payload_size = sizeof(ev) - sizeof(ev.msg.hdr);
 254                ev.msg.event_data.event = VMCI_EVENT_CTX_REMOVED;
 255                ev.payload.context_id = context_id;
 256
 257                result = vmci_datagram_dispatch(VMCI_HYPERVISOR_CONTEXT_ID,
 258                                                &ev.msg.hdr, false);
 259                if (result < VMCI_SUCCESS) {
 260                        pr_devel("Failed to enqueue event datagram (type=%d) for context (ID=0x%x)\n",
 261                                 ev.msg.event_data.event,
 262                                 ev.msg.hdr.dst.context);
 263                        /* We continue to enqueue on next subscriber. */
 264                }
 265        }
 266        vmci_handle_arr_destroy(subscriber_array);
 267
 268        return VMCI_SUCCESS;
 269}
 270
 271/*
 272 * Returns the current number of pending datagrams. The call may
 273 * also serve as a synchronization point for the datagram queue,
 274 * as no enqueue operations can occur concurrently.
 275 */
 276int vmci_ctx_pending_datagrams(u32 cid, u32 *pending)
 277{
 278        struct vmci_ctx *context;
 279
 280        context = vmci_ctx_get(cid);
 281        if (context == NULL)
 282                return VMCI_ERROR_INVALID_ARGS;
 283
 284        spin_lock(&context->lock);
 285        if (pending)
 286                *pending = context->pending_datagrams;
 287        spin_unlock(&context->lock);
 288        vmci_ctx_put(context);
 289
 290        return VMCI_SUCCESS;
 291}
 292
 293/*
 294 * Queues a VMCI datagram for the appropriate target VM context.
 295 */
 296int vmci_ctx_enqueue_datagram(u32 cid, struct vmci_datagram *dg)
 297{
 298        struct vmci_datagram_queue_entry *dq_entry;
 299        struct vmci_ctx *context;
 300        struct vmci_handle dg_src;
 301        size_t vmci_dg_size;
 302
 303        vmci_dg_size = VMCI_DG_SIZE(dg);
 304        if (vmci_dg_size > VMCI_MAX_DG_SIZE) {
 305                pr_devel("Datagram too large (bytes=%zu)\n", vmci_dg_size);
 306                return VMCI_ERROR_INVALID_ARGS;
 307        }
 308
 309        /* Get the target VM's VMCI context. */
 310        context = vmci_ctx_get(cid);
 311        if (!context) {
 312                pr_devel("Invalid context (ID=0x%x)\n", cid);
 313                return VMCI_ERROR_INVALID_ARGS;
 314        }
 315
 316        /* Allocate guest call entry and add it to the target VM's queue. */
 317        dq_entry = kmalloc(sizeof(*dq_entry), GFP_KERNEL);
 318        if (dq_entry == NULL) {
 319                pr_warn("Failed to allocate memory for datagram\n");
 320                vmci_ctx_put(context);
 321                return VMCI_ERROR_NO_MEM;
 322        }
 323        dq_entry->dg = dg;
 324        dq_entry->dg_size = vmci_dg_size;
 325        dg_src = dg->src;
 326        INIT_LIST_HEAD(&dq_entry->list_item);
 327
 328        spin_lock(&context->lock);
 329
 330        /*
 331         * We put a higher limit on datagrams from the hypervisor.  If
 332         * the pending datagram is not from hypervisor, then we check
 333         * if enqueueing it would exceed the
 334         * VMCI_MAX_DATAGRAM_QUEUE_SIZE limit on the destination.  If
 335         * the pending datagram is from hypervisor, we allow it to be
 336         * queued at the destination side provided we don't reach the
 337         * VMCI_MAX_DATAGRAM_AND_EVENT_QUEUE_SIZE limit.
 338         */
 339        if (context->datagram_queue_size + vmci_dg_size >=
 340            VMCI_MAX_DATAGRAM_QUEUE_SIZE &&
 341            (!vmci_handle_is_equal(dg_src,
 342                                vmci_make_handle
 343                                (VMCI_HYPERVISOR_CONTEXT_ID,
 344                                 VMCI_CONTEXT_RESOURCE_ID)) ||
 345             context->datagram_queue_size + vmci_dg_size >=
 346             VMCI_MAX_DATAGRAM_AND_EVENT_QUEUE_SIZE)) {
 347                spin_unlock(&context->lock);
 348                vmci_ctx_put(context);
 349                kfree(dq_entry);
 350                pr_devel("Context (ID=0x%x) receive queue is full\n", cid);
 351                return VMCI_ERROR_NO_RESOURCES;
 352        }
 353
 354        list_add(&dq_entry->list_item, &context->datagram_queue);
 355        context->pending_datagrams++;
 356        context->datagram_queue_size += vmci_dg_size;
 357        ctx_signal_notify(context);
 358        wake_up(&context->host_context.wait_queue);
 359        spin_unlock(&context->lock);
 360        vmci_ctx_put(context);
 361
 362        return vmci_dg_size;
 363}
 364
 365/*
 366 * Verifies whether a context with the specified context ID exists.
 367 * FIXME: utility is dubious as no decisions can be reliably made
 368 * using this data as context can appear and disappear at any time.
 369 */
 370bool vmci_ctx_exists(u32 cid)
 371{
 372        struct vmci_ctx *context;
 373        bool exists = false;
 374
 375        rcu_read_lock();
 376
 377        list_for_each_entry_rcu(context, &ctx_list.head, list_item) {
 378                if (context->cid == cid) {
 379                        exists = true;
 380                        break;
 381                }
 382        }
 383
 384        rcu_read_unlock();
 385        return exists;
 386}
 387
 388/*
 389 * Retrieves VMCI context corresponding to the given cid.
 390 */
 391struct vmci_ctx *vmci_ctx_get(u32 cid)
 392{
 393        struct vmci_ctx *c, *context = NULL;
 394
 395        if (cid == VMCI_INVALID_ID)
 396                return NULL;
 397
 398        rcu_read_lock();
 399        list_for_each_entry_rcu(c, &ctx_list.head, list_item) {
 400                if (c->cid == cid) {
 401                        /*
 402                         * The context owner drops its own reference to the
 403                         * context only after removing it from the list and
 404                         * waiting for RCU grace period to expire. This
 405                         * means that we are not about to increase the
 406                         * reference count of something that is in the
 407                         * process of being destroyed.
 408                         */
 409                        context = c;
 410                        kref_get(&context->kref);
 411                        break;
 412                }
 413        }
 414        rcu_read_unlock();
 415
 416        return context;
 417}
 418
 419/*
 420 * Deallocates all parts of a context data structure. This
 421 * function doesn't lock the context, because it assumes that
 422 * the caller was holding the last reference to context.
 423 */
 424static void ctx_free_ctx(struct kref *kref)
 425{
 426        struct vmci_ctx *context = container_of(kref, struct vmci_ctx, kref);
 427        struct vmci_datagram_queue_entry *dq_entry, *dq_entry_tmp;
 428        struct vmci_handle temp_handle;
 429        struct vmci_handle_list *notifier, *tmp;
 430
 431        /*
 432         * Fire event to all contexts interested in knowing this
 433         * context is dying.
 434         */
 435        ctx_fire_notification(context->cid, context->priv_flags);
 436
 437        /*
 438         * Cleanup all queue pair resources attached to context.  If
 439         * the VM dies without cleaning up, this code will make sure
 440         * that no resources are leaked.
 441         */
 442        temp_handle = vmci_handle_arr_get_entry(context->queue_pair_array, 0);
 443        while (!vmci_handle_is_equal(temp_handle, VMCI_INVALID_HANDLE)) {
 444                if (vmci_qp_broker_detach(temp_handle,
 445                                          context) < VMCI_SUCCESS) {
 446                        /*
 447                         * When vmci_qp_broker_detach() succeeds it
 448                         * removes the handle from the array.  If
 449                         * detach fails, we must remove the handle
 450                         * ourselves.
 451                         */
 452                        vmci_handle_arr_remove_entry(context->queue_pair_array,
 453                                                     temp_handle);
 454                }
 455                temp_handle =
 456                    vmci_handle_arr_get_entry(context->queue_pair_array, 0);
 457        }
 458
 459        /*
 460         * It is fine to destroy this without locking the callQueue, as
 461         * this is the only thread having a reference to the context.
 462         */
 463        list_for_each_entry_safe(dq_entry, dq_entry_tmp,
 464                                 &context->datagram_queue, list_item) {
 465                WARN_ON(dq_entry->dg_size != VMCI_DG_SIZE(dq_entry->dg));
 466                list_del(&dq_entry->list_item);
 467                kfree(dq_entry->dg);
 468                kfree(dq_entry);
 469        }
 470
 471        list_for_each_entry_safe(notifier, tmp,
 472                                 &context->notifier_list, node) {
 473                list_del(&notifier->node);
 474                kfree(notifier);
 475        }
 476
 477        vmci_handle_arr_destroy(context->queue_pair_array);
 478        vmci_handle_arr_destroy(context->doorbell_array);
 479        vmci_handle_arr_destroy(context->pending_doorbell_array);
 480        vmci_ctx_unset_notify(context);
 481        if (context->cred)
 482                put_cred(context->cred);
 483        kfree(context);
 484}
 485
 486/*
 487 * Drops reference to VMCI context. If this is the last reference to
 488 * the context it will be deallocated. A context is created with
 489 * a reference count of one, and on destroy, it is removed from
 490 * the context list before its reference count is decremented. Thus,
 491 * if we reach zero, we are sure that nobody else are about to increment
 492 * it (they need the entry in the context list for that), and so there
 493 * is no need for locking.
 494 */
 495void vmci_ctx_put(struct vmci_ctx *context)
 496{
 497        kref_put(&context->kref, ctx_free_ctx);
 498}
 499
 500/*
 501 * Dequeues the next datagram and returns it to caller.
 502 * The caller passes in a pointer to the max size datagram
 503 * it can handle and the datagram is only unqueued if the
 504 * size is less than max_size. If larger max_size is set to
 505 * the size of the datagram to give the caller a chance to
 506 * set up a larger buffer for the guestcall.
 507 */
 508int vmci_ctx_dequeue_datagram(struct vmci_ctx *context,
 509                              size_t *max_size,
 510                              struct vmci_datagram **dg)
 511{
 512        struct vmci_datagram_queue_entry *dq_entry;
 513        struct list_head *list_item;
 514        int rv;
 515
 516        /* Dequeue the next datagram entry. */
 517        spin_lock(&context->lock);
 518        if (context->pending_datagrams == 0) {
 519                ctx_clear_notify_call(context);
 520                spin_unlock(&context->lock);
 521                pr_devel("No datagrams pending\n");
 522                return VMCI_ERROR_NO_MORE_DATAGRAMS;
 523        }
 524
 525        list_item = context->datagram_queue.next;
 526
 527        dq_entry =
 528            list_entry(list_item, struct vmci_datagram_queue_entry, list_item);
 529
 530        /* Check size of caller's buffer. */
 531        if (*max_size < dq_entry->dg_size) {
 532                *max_size = dq_entry->dg_size;
 533                spin_unlock(&context->lock);
 534                pr_devel("Caller's buffer should be at least (size=%u bytes)\n",
 535                         (u32) *max_size);
 536                return VMCI_ERROR_NO_MEM;
 537        }
 538
 539        list_del(list_item);
 540        context->pending_datagrams--;
 541        context->datagram_queue_size -= dq_entry->dg_size;
 542        if (context->pending_datagrams == 0) {
 543                ctx_clear_notify_call(context);
 544                rv = VMCI_SUCCESS;
 545        } else {
 546                /*
 547                 * Return the size of the next datagram.
 548                 */
 549                struct vmci_datagram_queue_entry *next_entry;
 550
 551                list_item = context->datagram_queue.next;
 552                next_entry =
 553                    list_entry(list_item, struct vmci_datagram_queue_entry,
 554                               list_item);
 555
 556                /*
 557                 * The following size_t -> int truncation is fine as
 558                 * the maximum size of a (routable) datagram is 68KB.
 559                 */
 560                rv = (int)next_entry->dg_size;
 561        }
 562        spin_unlock(&context->lock);
 563
 564        /* Caller must free datagram. */
 565        *dg = dq_entry->dg;
 566        dq_entry->dg = NULL;
 567        kfree(dq_entry);
 568
 569        return rv;
 570}
 571
 572/*
 573 * Reverts actions set up by vmci_setup_notify().  Unmaps and unlocks the
 574 * page mapped/locked by vmci_setup_notify().
 575 */
 576void vmci_ctx_unset_notify(struct vmci_ctx *context)
 577{
 578        struct page *notify_page;
 579
 580        spin_lock(&context->lock);
 581
 582        notify_page = context->notify_page;
 583        context->notify = &ctx_dummy_notify;
 584        context->notify_page = NULL;
 585
 586        spin_unlock(&context->lock);
 587
 588        if (notify_page) {
 589                kunmap(notify_page);
 590                put_page(notify_page);
 591        }
 592}
 593
 594/*
 595 * Add remote_cid to list of contexts current contexts wants
 596 * notifications from/about.
 597 */
 598int vmci_ctx_add_notification(u32 context_id, u32 remote_cid)
 599{
 600        struct vmci_ctx *context;
 601        struct vmci_handle_list *notifier, *n;
 602        int result;
 603        bool exists = false;
 604
 605        context = vmci_ctx_get(context_id);
 606        if (!context)
 607                return VMCI_ERROR_NOT_FOUND;
 608
 609        if (VMCI_CONTEXT_IS_VM(context_id) && VMCI_CONTEXT_IS_VM(remote_cid)) {
 610                pr_devel("Context removed notifications for other VMs not supported (src=0x%x, remote=0x%x)\n",
 611                         context_id, remote_cid);
 612                result = VMCI_ERROR_DST_UNREACHABLE;
 613                goto out;
 614        }
 615
 616        if (context->priv_flags & VMCI_PRIVILEGE_FLAG_RESTRICTED) {
 617                result = VMCI_ERROR_NO_ACCESS;
 618                goto out;
 619        }
 620
 621        notifier = kmalloc(sizeof(struct vmci_handle_list), GFP_KERNEL);
 622        if (!notifier) {
 623                result = VMCI_ERROR_NO_MEM;
 624                goto out;
 625        }
 626
 627        INIT_LIST_HEAD(&notifier->node);
 628        notifier->handle = vmci_make_handle(remote_cid, VMCI_EVENT_HANDLER);
 629
 630        spin_lock(&context->lock);
 631
 632        if (context->n_notifiers < VMCI_MAX_CONTEXTS) {
 633                list_for_each_entry(n, &context->notifier_list, node) {
 634                        if (vmci_handle_is_equal(n->handle, notifier->handle)) {
 635                                exists = true;
 636                                break;
 637                        }
 638                }
 639
 640                if (exists) {
 641                        kfree(notifier);
 642                        result = VMCI_ERROR_ALREADY_EXISTS;
 643                } else {
 644                        list_add_tail_rcu(&notifier->node,
 645                                          &context->notifier_list);
 646                        context->n_notifiers++;
 647                        result = VMCI_SUCCESS;
 648                }
 649        } else {
 650                kfree(notifier);
 651                result = VMCI_ERROR_NO_MEM;
 652        }
 653
 654        spin_unlock(&context->lock);
 655
 656 out:
 657        vmci_ctx_put(context);
 658        return result;
 659}
 660
 661/*
 662 * Remove remote_cid from current context's list of contexts it is
 663 * interested in getting notifications from/about.
 664 */
 665int vmci_ctx_remove_notification(u32 context_id, u32 remote_cid)
 666{
 667        struct vmci_ctx *context;
 668        struct vmci_handle_list *notifier, *tmp;
 669        struct vmci_handle handle;
 670        bool found = false;
 671
 672        context = vmci_ctx_get(context_id);
 673        if (!context)
 674                return VMCI_ERROR_NOT_FOUND;
 675
 676        handle = vmci_make_handle(remote_cid, VMCI_EVENT_HANDLER);
 677
 678        spin_lock(&context->lock);
 679        list_for_each_entry_safe(notifier, tmp,
 680                                 &context->notifier_list, node) {
 681                if (vmci_handle_is_equal(notifier->handle, handle)) {
 682                        list_del_rcu(&notifier->node);
 683                        context->n_notifiers--;
 684                        found = true;
 685                        break;
 686                }
 687        }
 688        spin_unlock(&context->lock);
 689
 690        if (found) {
 691                synchronize_rcu();
 692                kfree(notifier);
 693        }
 694
 695        vmci_ctx_put(context);
 696
 697        return found ? VMCI_SUCCESS : VMCI_ERROR_NOT_FOUND;
 698}
 699
 700static int vmci_ctx_get_chkpt_notifiers(struct vmci_ctx *context,
 701                                        u32 *buf_size, void **pbuf)
 702{
 703        u32 *notifiers;
 704        size_t data_size;
 705        struct vmci_handle_list *entry;
 706        int i = 0;
 707
 708        if (context->n_notifiers == 0) {
 709                *buf_size = 0;
 710                *pbuf = NULL;
 711                return VMCI_SUCCESS;
 712        }
 713
 714        data_size = context->n_notifiers * sizeof(*notifiers);
 715        if (*buf_size < data_size) {
 716                *buf_size = data_size;
 717                return VMCI_ERROR_MORE_DATA;
 718        }
 719
 720        notifiers = kmalloc(data_size, GFP_ATOMIC); /* FIXME: want GFP_KERNEL */
 721        if (!notifiers)
 722                return VMCI_ERROR_NO_MEM;
 723
 724        list_for_each_entry(entry, &context->notifier_list, node)
 725                notifiers[i++] = entry->handle.context;
 726
 727        *buf_size = data_size;
 728        *pbuf = notifiers;
 729        return VMCI_SUCCESS;
 730}
 731
 732static int vmci_ctx_get_chkpt_doorbells(struct vmci_ctx *context,
 733                                        u32 *buf_size, void **pbuf)
 734{
 735        struct dbell_cpt_state *dbells;
 736        u32 i, n_doorbells;
 737
 738        n_doorbells = vmci_handle_arr_get_size(context->doorbell_array);
 739        if (n_doorbells > 0) {
 740                size_t data_size = n_doorbells * sizeof(*dbells);
 741                if (*buf_size < data_size) {
 742                        *buf_size = data_size;
 743                        return VMCI_ERROR_MORE_DATA;
 744                }
 745
 746                dbells = kmalloc(data_size, GFP_ATOMIC);
 747                if (!dbells)
 748                        return VMCI_ERROR_NO_MEM;
 749
 750                for (i = 0; i < n_doorbells; i++)
 751                        dbells[i].handle = vmci_handle_arr_get_entry(
 752                                                context->doorbell_array, i);
 753
 754                *buf_size = data_size;
 755                *pbuf = dbells;
 756        } else {
 757                *buf_size = 0;
 758                *pbuf = NULL;
 759        }
 760
 761        return VMCI_SUCCESS;
 762}
 763
 764/*
 765 * Get current context's checkpoint state of given type.
 766 */
 767int vmci_ctx_get_chkpt_state(u32 context_id,
 768                             u32 cpt_type,
 769                             u32 *buf_size,
 770                             void **pbuf)
 771{
 772        struct vmci_ctx *context;
 773        int result;
 774
 775        context = vmci_ctx_get(context_id);
 776        if (!context)
 777                return VMCI_ERROR_NOT_FOUND;
 778
 779        spin_lock(&context->lock);
 780
 781        switch (cpt_type) {
 782        case VMCI_NOTIFICATION_CPT_STATE:
 783                result = vmci_ctx_get_chkpt_notifiers(context, buf_size, pbuf);
 784                break;
 785
 786        case VMCI_WELLKNOWN_CPT_STATE:
 787                /*
 788                 * For compatibility with VMX'en with VM to VM communication, we
 789                 * always return zero wellknown handles.
 790                 */
 791
 792                *buf_size = 0;
 793                *pbuf = NULL;
 794                result = VMCI_SUCCESS;
 795                break;
 796
 797        case VMCI_DOORBELL_CPT_STATE:
 798                result = vmci_ctx_get_chkpt_doorbells(context, buf_size, pbuf);
 799                break;
 800
 801        default:
 802                pr_devel("Invalid cpt state (type=%d)\n", cpt_type);
 803                result = VMCI_ERROR_INVALID_ARGS;
 804                break;
 805        }
 806
 807        spin_unlock(&context->lock);
 808        vmci_ctx_put(context);
 809
 810        return result;
 811}
 812
 813/*
 814 * Set current context's checkpoint state of given type.
 815 */
 816int vmci_ctx_set_chkpt_state(u32 context_id,
 817                             u32 cpt_type,
 818                             u32 buf_size,
 819                             void *cpt_buf)
 820{
 821        u32 i;
 822        u32 current_id;
 823        int result = VMCI_SUCCESS;
 824        u32 num_ids = buf_size / sizeof(u32);
 825
 826        if (cpt_type == VMCI_WELLKNOWN_CPT_STATE && num_ids > 0) {
 827                /*
 828                 * We would end up here if VMX with VM to VM communication
 829                 * attempts to restore a checkpoint with wellknown handles.
 830                 */
 831                pr_warn("Attempt to restore checkpoint with obsolete wellknown handles\n");
 832                return VMCI_ERROR_OBSOLETE;
 833        }
 834
 835        if (cpt_type != VMCI_NOTIFICATION_CPT_STATE) {
 836                pr_devel("Invalid cpt state (type=%d)\n", cpt_type);
 837                return VMCI_ERROR_INVALID_ARGS;
 838        }
 839
 840        for (i = 0; i < num_ids && result == VMCI_SUCCESS; i++) {
 841                current_id = ((u32 *)cpt_buf)[i];
 842                result = vmci_ctx_add_notification(context_id, current_id);
 843                if (result != VMCI_SUCCESS)
 844                        break;
 845        }
 846        if (result != VMCI_SUCCESS)
 847                pr_devel("Failed to set cpt state (type=%d) (error=%d)\n",
 848                         cpt_type, result);
 849
 850        return result;
 851}
 852
 853/*
 854 * Retrieves the specified context's pending notifications in the
 855 * form of a handle array. The handle arrays returned are the
 856 * actual data - not a copy and should not be modified by the
 857 * caller. They must be released using
 858 * vmci_ctx_rcv_notifications_release.
 859 */
 860int vmci_ctx_rcv_notifications_get(u32 context_id,
 861                                   struct vmci_handle_arr **db_handle_array,
 862                                   struct vmci_handle_arr **qp_handle_array)
 863{
 864        struct vmci_ctx *context;
 865        int result = VMCI_SUCCESS;
 866
 867        context = vmci_ctx_get(context_id);
 868        if (context == NULL)
 869                return VMCI_ERROR_NOT_FOUND;
 870
 871        spin_lock(&context->lock);
 872
 873        *db_handle_array = context->pending_doorbell_array;
 874        context->pending_doorbell_array =
 875                vmci_handle_arr_create(0, VMCI_MAX_GUEST_DOORBELL_COUNT);
 876        if (!context->pending_doorbell_array) {
 877                context->pending_doorbell_array = *db_handle_array;
 878                *db_handle_array = NULL;
 879                result = VMCI_ERROR_NO_MEM;
 880        }
 881        *qp_handle_array = NULL;
 882
 883        spin_unlock(&context->lock);
 884        vmci_ctx_put(context);
 885
 886        return result;
 887}
 888
 889/*
 890 * Releases handle arrays with pending notifications previously
 891 * retrieved using vmci_ctx_rcv_notifications_get. If the
 892 * notifications were not successfully handed over to the guest,
 893 * success must be false.
 894 */
 895void vmci_ctx_rcv_notifications_release(u32 context_id,
 896                                        struct vmci_handle_arr *db_handle_array,
 897                                        struct vmci_handle_arr *qp_handle_array,
 898                                        bool success)
 899{
 900        struct vmci_ctx *context = vmci_ctx_get(context_id);
 901
 902        spin_lock(&context->lock);
 903        if (!success) {
 904                struct vmci_handle handle;
 905
 906                /*
 907                 * New notifications may have been added while we were not
 908                 * holding the context lock, so we transfer any new pending
 909                 * doorbell notifications to the old array, and reinstate the
 910                 * old array.
 911                 */
 912
 913                handle = vmci_handle_arr_remove_tail(
 914                                        context->pending_doorbell_array);
 915                while (!vmci_handle_is_invalid(handle)) {
 916                        if (!vmci_handle_arr_has_entry(db_handle_array,
 917                                                       handle)) {
 918                                vmci_handle_arr_append_entry(
 919                                                &db_handle_array, handle);
 920                        }
 921                        handle = vmci_handle_arr_remove_tail(
 922                                        context->pending_doorbell_array);
 923                }
 924                vmci_handle_arr_destroy(context->pending_doorbell_array);
 925                context->pending_doorbell_array = db_handle_array;
 926                db_handle_array = NULL;
 927        } else {
 928                ctx_clear_notify_call(context);
 929        }
 930        spin_unlock(&context->lock);
 931        vmci_ctx_put(context);
 932
 933        if (db_handle_array)
 934                vmci_handle_arr_destroy(db_handle_array);
 935
 936        if (qp_handle_array)
 937                vmci_handle_arr_destroy(qp_handle_array);
 938}
 939
 940/*
 941 * Registers that a new doorbell handle has been allocated by the
 942 * context. Only doorbell handles registered can be notified.
 943 */
 944int vmci_ctx_dbell_create(u32 context_id, struct vmci_handle handle)
 945{
 946        struct vmci_ctx *context;
 947        int result;
 948
 949        if (context_id == VMCI_INVALID_ID || vmci_handle_is_invalid(handle))
 950                return VMCI_ERROR_INVALID_ARGS;
 951
 952        context = vmci_ctx_get(context_id);
 953        if (context == NULL)
 954                return VMCI_ERROR_NOT_FOUND;
 955
 956        spin_lock(&context->lock);
 957        if (!vmci_handle_arr_has_entry(context->doorbell_array, handle))
 958                result = vmci_handle_arr_append_entry(&context->doorbell_array,
 959                                                      handle);
 960        else
 961                result = VMCI_ERROR_DUPLICATE_ENTRY;
 962
 963        spin_unlock(&context->lock);
 964        vmci_ctx_put(context);
 965
 966        return result;
 967}
 968
 969/*
 970 * Unregisters a doorbell handle that was previously registered
 971 * with vmci_ctx_dbell_create.
 972 */
 973int vmci_ctx_dbell_destroy(u32 context_id, struct vmci_handle handle)
 974{
 975        struct vmci_ctx *context;
 976        struct vmci_handle removed_handle;
 977
 978        if (context_id == VMCI_INVALID_ID || vmci_handle_is_invalid(handle))
 979                return VMCI_ERROR_INVALID_ARGS;
 980
 981        context = vmci_ctx_get(context_id);
 982        if (context == NULL)
 983                return VMCI_ERROR_NOT_FOUND;
 984
 985        spin_lock(&context->lock);
 986        removed_handle =
 987            vmci_handle_arr_remove_entry(context->doorbell_array, handle);
 988        vmci_handle_arr_remove_entry(context->pending_doorbell_array, handle);
 989        spin_unlock(&context->lock);
 990
 991        vmci_ctx_put(context);
 992
 993        return vmci_handle_is_invalid(removed_handle) ?
 994            VMCI_ERROR_NOT_FOUND : VMCI_SUCCESS;
 995}
 996
 997/*
 998 * Unregisters all doorbell handles that were previously
 999 * registered with vmci_ctx_dbell_create.
1000 */
1001int vmci_ctx_dbell_destroy_all(u32 context_id)
1002{
1003        struct vmci_ctx *context;
1004        struct vmci_handle handle;
1005
1006        if (context_id == VMCI_INVALID_ID)
1007                return VMCI_ERROR_INVALID_ARGS;
1008
1009        context = vmci_ctx_get(context_id);
1010        if (context == NULL)
1011                return VMCI_ERROR_NOT_FOUND;
1012
1013        spin_lock(&context->lock);
1014        do {
1015                struct vmci_handle_arr *arr = context->doorbell_array;
1016                handle = vmci_handle_arr_remove_tail(arr);
1017        } while (!vmci_handle_is_invalid(handle));
1018        do {
1019                struct vmci_handle_arr *arr = context->pending_doorbell_array;
1020                handle = vmci_handle_arr_remove_tail(arr);
1021        } while (!vmci_handle_is_invalid(handle));
1022        spin_unlock(&context->lock);
1023
1024        vmci_ctx_put(context);
1025
1026        return VMCI_SUCCESS;
1027}
1028
1029/*
1030 * Registers a notification of a doorbell handle initiated by the
1031 * specified source context. The notification of doorbells are
1032 * subject to the same isolation rules as datagram delivery. To
1033 * allow host side senders of notifications a finer granularity
1034 * of sender rights than those assigned to the sending context
1035 * itself, the host context is required to specify a different
1036 * set of privilege flags that will override the privileges of
1037 * the source context.
1038 */
1039int vmci_ctx_notify_dbell(u32 src_cid,
1040                          struct vmci_handle handle,
1041                          u32 src_priv_flags)
1042{
1043        struct vmci_ctx *dst_context;
1044        int result;
1045
1046        if (vmci_handle_is_invalid(handle))
1047                return VMCI_ERROR_INVALID_ARGS;
1048
1049        /* Get the target VM's VMCI context. */
1050        dst_context = vmci_ctx_get(handle.context);
1051        if (!dst_context) {
1052                pr_devel("Invalid context (ID=0x%x)\n", handle.context);
1053                return VMCI_ERROR_NOT_FOUND;
1054        }
1055
1056        if (src_cid != handle.context) {
1057                u32 dst_priv_flags;
1058
1059                if (VMCI_CONTEXT_IS_VM(src_cid) &&
1060                    VMCI_CONTEXT_IS_VM(handle.context)) {
1061                        pr_devel("Doorbell notification from VM to VM not supported (src=0x%x, dst=0x%x)\n",
1062                                 src_cid, handle.context);
1063                        result = VMCI_ERROR_DST_UNREACHABLE;
1064                        goto out;
1065                }
1066
1067                result = vmci_dbell_get_priv_flags(handle, &dst_priv_flags);
1068                if (result < VMCI_SUCCESS) {
1069                        pr_warn("Failed to get privilege flags for destination (handle=0x%x:0x%x)\n",
1070                                handle.context, handle.resource);
1071                        goto out;
1072                }
1073
1074                if (src_cid != VMCI_HOST_CONTEXT_ID ||
1075                    src_priv_flags == VMCI_NO_PRIVILEGE_FLAGS) {
1076                        src_priv_flags = vmci_context_get_priv_flags(src_cid);
1077                }
1078
1079                if (vmci_deny_interaction(src_priv_flags, dst_priv_flags)) {
1080                        result = VMCI_ERROR_NO_ACCESS;
1081                        goto out;
1082                }
1083        }
1084
1085        if (handle.context == VMCI_HOST_CONTEXT_ID) {
1086                result = vmci_dbell_host_context_notify(src_cid, handle);
1087        } else {
1088                spin_lock(&dst_context->lock);
1089
1090                if (!vmci_handle_arr_has_entry(dst_context->doorbell_array,
1091                                               handle)) {
1092                        result = VMCI_ERROR_NOT_FOUND;
1093                } else {
1094                        if (!vmci_handle_arr_has_entry(
1095                                        dst_context->pending_doorbell_array,
1096                                        handle)) {
1097                                result = vmci_handle_arr_append_entry(
1098                                        &dst_context->pending_doorbell_array,
1099                                        handle);
1100                                if (result == VMCI_SUCCESS) {
1101                                        ctx_signal_notify(dst_context);
1102                                        wake_up(&dst_context->host_context.wait_queue);
1103                                }
1104                        } else {
1105                                result = VMCI_SUCCESS;
1106                        }
1107                }
1108                spin_unlock(&dst_context->lock);
1109        }
1110
1111 out:
1112        vmci_ctx_put(dst_context);
1113
1114        return result;
1115}
1116
1117bool vmci_ctx_supports_host_qp(struct vmci_ctx *context)
1118{
1119        return context && context->user_version >= VMCI_VERSION_HOSTQP;
1120}
1121
1122/*
1123 * Registers that a new queue pair handle has been allocated by
1124 * the context.
1125 */
1126int vmci_ctx_qp_create(struct vmci_ctx *context, struct vmci_handle handle)
1127{
1128        int result;
1129
1130        if (context == NULL || vmci_handle_is_invalid(handle))
1131                return VMCI_ERROR_INVALID_ARGS;
1132
1133        if (!vmci_handle_arr_has_entry(context->queue_pair_array, handle))
1134                result = vmci_handle_arr_append_entry(
1135                        &context->queue_pair_array, handle);
1136        else
1137                result = VMCI_ERROR_DUPLICATE_ENTRY;
1138
1139        return result;
1140}
1141
1142/*
1143 * Unregisters a queue pair handle that was previously registered
1144 * with vmci_ctx_qp_create.
1145 */
1146int vmci_ctx_qp_destroy(struct vmci_ctx *context, struct vmci_handle handle)
1147{
1148        struct vmci_handle hndl;
1149
1150        if (context == NULL || vmci_handle_is_invalid(handle))
1151                return VMCI_ERROR_INVALID_ARGS;
1152
1153        hndl = vmci_handle_arr_remove_entry(context->queue_pair_array, handle);
1154
1155        return vmci_handle_is_invalid(hndl) ?
1156                VMCI_ERROR_NOT_FOUND : VMCI_SUCCESS;
1157}
1158
1159/*
1160 * Determines whether a given queue pair handle is registered
1161 * with the given context.
1162 */
1163bool vmci_ctx_qp_exists(struct vmci_ctx *context, struct vmci_handle handle)
1164{
1165        if (context == NULL || vmci_handle_is_invalid(handle))
1166                return false;
1167
1168        return vmci_handle_arr_has_entry(context->queue_pair_array, handle);
1169}
1170
1171/*
1172 * vmci_context_get_priv_flags() - Retrieve privilege flags.
1173 * @context_id: The context ID of the VMCI context.
1174 *
1175 * Retrieves privilege flags of the given VMCI context ID.
1176 */
1177u32 vmci_context_get_priv_flags(u32 context_id)
1178{
1179        if (vmci_host_code_active()) {
1180                u32 flags;
1181                struct vmci_ctx *context;
1182
1183                context = vmci_ctx_get(context_id);
1184                if (!context)
1185                        return VMCI_LEAST_PRIVILEGE_FLAGS;
1186
1187                flags = context->priv_flags;
1188                vmci_ctx_put(context);
1189                return flags;
1190        }
1191        return VMCI_NO_PRIVILEGE_FLAGS;
1192}
1193EXPORT_SYMBOL_GPL(vmci_context_get_priv_flags);
1194
1195/*
1196 * vmci_is_context_owner() - Determimnes if user is the context owner
1197 * @context_id: The context ID of the VMCI context.
1198 * @uid:        The host user id (real kernel value).
1199 *
1200 * Determines whether a given UID is the owner of given VMCI context.
1201 */
1202bool vmci_is_context_owner(u32 context_id, kuid_t uid)
1203{
1204        bool is_owner = false;
1205
1206        if (vmci_host_code_active()) {
1207                struct vmci_ctx *context = vmci_ctx_get(context_id);
1208                if (context) {
1209                        if (context->cred)
1210                                is_owner = uid_eq(context->cred->uid, uid);
1211                        vmci_ctx_put(context);
1212                }
1213        }
1214
1215        return is_owner;
1216}
1217EXPORT_SYMBOL_GPL(vmci_is_context_owner);
1218