linux/drivers/infiniband/hw/hfi1/user_sdma.h
<<
>>
Prefs
   1#ifndef _HFI1_USER_SDMA_H
   2#define _HFI1_USER_SDMA_H
   3/*
   4 * Copyright(c) 2015 - 2018 Intel Corporation.
   5 *
   6 * This file is provided under a dual BSD/GPLv2 license.  When using or
   7 * redistributing this file, you may do so under either license.
   8 *
   9 * GPL LICENSE SUMMARY
  10 *
  11 * This program is free software; you can redistribute it and/or modify
  12 * it under the terms of version 2 of the GNU General Public License as
  13 * published by the Free Software Foundation.
  14 *
  15 * This program is distributed in the hope that it will be useful, but
  16 * WITHOUT ANY WARRANTY; without even the implied warranty of
  17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  18 * General Public License for more details.
  19 *
  20 * BSD LICENSE
  21 *
  22 * Redistribution and use in source and binary forms, with or without
  23 * modification, are permitted provided that the following conditions
  24 * are met:
  25 *
  26 *  - Redistributions of source code must retain the above copyright
  27 *    notice, this list of conditions and the following disclaimer.
  28 *  - Redistributions in binary form must reproduce the above copyright
  29 *    notice, this list of conditions and the following disclaimer in
  30 *    the documentation and/or other materials provided with the
  31 *    distribution.
  32 *  - Neither the name of Intel Corporation nor the names of its
  33 *    contributors may be used to endorse or promote products derived
  34 *    from this software without specific prior written permission.
  35 *
  36 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  37 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  38 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  39 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  40 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  41 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  42 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  43 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  44 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  45 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  46 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  47 *
  48 */
  49#include <linux/device.h>
  50#include <linux/wait.h>
  51
  52#include "common.h"
  53#include "iowait.h"
  54#include "user_exp_rcv.h"
  55
  56/* The maximum number of Data io vectors per message/request */
  57#define MAX_VECTORS_PER_REQ 8
  58/*
  59 * Maximum number of packet to send from each message/request
  60 * before moving to the next one.
  61 */
  62#define MAX_PKTS_PER_QUEUE 16
  63
  64#define num_pages(x) (1 + ((((x) - 1) & PAGE_MASK) >> PAGE_SHIFT))
  65
  66#define req_opcode(x) \
  67        (((x) >> HFI1_SDMA_REQ_OPCODE_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
  68#define req_version(x) \
  69        (((x) >> HFI1_SDMA_REQ_VERSION_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
  70#define req_iovcnt(x) \
  71        (((x) >> HFI1_SDMA_REQ_IOVCNT_SHIFT) & HFI1_SDMA_REQ_IOVCNT_MASK)
  72
  73/* Number of BTH.PSN bits used for sequence number in expected rcvs */
  74#define BTH_SEQ_MASK 0x7ffull
  75
  76#define AHG_KDETH_INTR_SHIFT 12
  77#define AHG_KDETH_SH_SHIFT   13
  78#define AHG_KDETH_ARRAY_SIZE  9
  79
  80#define PBC2LRH(x) ((((x) & 0xfff) << 2) - 4)
  81#define LRH2PBC(x) ((((x) >> 2) + 1) & 0xfff)
  82
  83/**
  84 * Build an SDMA AHG header update descriptor and save it to an array.
  85 * @arr        - Array to save the descriptor to.
  86 * @idx        - Index of the array at which the descriptor will be saved.
  87 * @array_size - Size of the array arr.
  88 * @dw         - Update index into the header in DWs.
  89 * @bit        - Start bit.
  90 * @width      - Field width.
  91 * @value      - 16 bits of immediate data to write into the field.
  92 * Returns -ERANGE if idx is invalid. If successful, returns the next index
  93 * (idx + 1) of the array to be used for the next descriptor.
  94 */
  95static inline int ahg_header_set(u32 *arr, int idx, size_t array_size,
  96                                 u8 dw, u8 bit, u8 width, u16 value)
  97{
  98        if ((size_t)idx >= array_size)
  99                return -ERANGE;
 100        arr[idx++] = sdma_build_ahg_descriptor(value, dw, bit, width);
 101        return idx;
 102}
 103
 104/* Tx request flag bits */
 105#define TXREQ_FLAGS_REQ_ACK   BIT(0)      /* Set the ACK bit in the header */
 106#define TXREQ_FLAGS_REQ_DISABLE_SH BIT(1) /* Disable header suppression */
 107
 108enum pkt_q_sdma_state {
 109        SDMA_PKT_Q_ACTIVE,
 110        SDMA_PKT_Q_DEFERRED,
 111};
 112
 113/*
 114 * Maximum retry attempts to submit a TX request
 115 * before putting the process to sleep.
 116 */
 117#define MAX_DEFER_RETRY_COUNT 1
 118
 119#define SDMA_IOWAIT_TIMEOUT 1000 /* in milliseconds */
 120
 121#define SDMA_DBG(req, fmt, ...)                              \
 122        hfi1_cdbg(SDMA, "[%u:%u:%u:%u] " fmt, (req)->pq->dd->unit, \
 123                 (req)->pq->ctxt, (req)->pq->subctxt, (req)->info.comp_idx, \
 124                 ##__VA_ARGS__)
 125
 126struct hfi1_user_sdma_pkt_q {
 127        u16 ctxt;
 128        u16 subctxt;
 129        u16 n_max_reqs;
 130        atomic_t n_reqs;
 131        u16 reqidx;
 132        struct hfi1_devdata *dd;
 133        struct kmem_cache *txreq_cache;
 134        struct user_sdma_request *reqs;
 135        unsigned long *req_in_use;
 136        struct iowait busy;
 137        enum pkt_q_sdma_state state;
 138        wait_queue_head_t wait;
 139        unsigned long unpinned;
 140        struct mmu_rb_handler *handler;
 141        atomic_t n_locked;
 142        struct mm_struct *mm;
 143};
 144
 145struct hfi1_user_sdma_comp_q {
 146        u16 nentries;
 147        struct hfi1_sdma_comp_entry *comps;
 148};
 149
 150struct sdma_mmu_node {
 151        struct mmu_rb_node rb;
 152        struct hfi1_user_sdma_pkt_q *pq;
 153        atomic_t refcount;
 154        struct page **pages;
 155        unsigned int npages;
 156};
 157
 158struct user_sdma_iovec {
 159        struct list_head list;
 160        struct iovec iov;
 161        /* number of pages in this vector */
 162        unsigned int npages;
 163        /* array of pinned pages for this vector */
 164        struct page **pages;
 165        /*
 166         * offset into the virtual address space of the vector at
 167         * which we last left off.
 168         */
 169        u64 offset;
 170        struct sdma_mmu_node *node;
 171};
 172
 173/* evict operation argument */
 174struct evict_data {
 175        u32 cleared;    /* count evicted so far */
 176        u32 target;     /* target count to evict */
 177};
 178
 179struct user_sdma_request {
 180        /* This is the original header from user space */
 181        struct hfi1_pkt_header hdr;
 182
 183        /* Read mostly fields */
 184        struct hfi1_user_sdma_pkt_q *pq ____cacheline_aligned_in_smp;
 185        struct hfi1_user_sdma_comp_q *cq;
 186        /*
 187         * Pointer to the SDMA engine for this request.
 188         * Since different request could be on different VLs,
 189         * each request will need it's own engine pointer.
 190         */
 191        struct sdma_engine *sde;
 192        struct sdma_req_info info;
 193        /* TID array values copied from the tid_iov vector */
 194        u32 *tids;
 195        /* total length of the data in the request */
 196        u32 data_len;
 197        /* number of elements copied to the tids array */
 198        u16 n_tids;
 199        /*
 200         * We copy the iovs for this request (based on
 201         * info.iovcnt). These are only the data vectors
 202         */
 203        u8 data_iovs;
 204        s8 ahg_idx;
 205
 206        /* Writeable fields shared with interrupt */
 207        u16 seqcomp ____cacheline_aligned_in_smp;
 208        u16 seqsubmitted;
 209
 210        /* Send side fields */
 211        struct list_head txps ____cacheline_aligned_in_smp;
 212        u16 seqnum;
 213        /*
 214         * KDETH.OFFSET (TID) field
 215         * The offset can cover multiple packets, depending on the
 216         * size of the TID entry.
 217         */
 218        u32 tidoffset;
 219        /*
 220         * KDETH.Offset (Eager) field
 221         * We need to remember the initial value so the headers
 222         * can be updated properly.
 223         */
 224        u32 koffset;
 225        u32 sent;
 226        /* TID index copied from the tid_iov vector */
 227        u16 tididx;
 228        /* progress index moving along the iovs array */
 229        u8 iov_idx;
 230        u8 has_error;
 231
 232        struct user_sdma_iovec iovs[MAX_VECTORS_PER_REQ];
 233} ____cacheline_aligned_in_smp;
 234
 235/*
 236 * A single txreq could span up to 3 physical pages when the MTU
 237 * is sufficiently large (> 4K). Each of the IOV pointers also
 238 * needs it's own set of flags so the vector has been handled
 239 * independently of each other.
 240 */
 241struct user_sdma_txreq {
 242        /* Packet header for the txreq */
 243        struct hfi1_pkt_header hdr;
 244        struct sdma_txreq txreq;
 245        struct list_head list;
 246        struct user_sdma_request *req;
 247        u16 flags;
 248        u16 seqnum;
 249};
 250
 251int hfi1_user_sdma_alloc_queues(struct hfi1_ctxtdata *uctxt,
 252                                struct hfi1_filedata *fd);
 253int hfi1_user_sdma_free_queues(struct hfi1_filedata *fd,
 254                               struct hfi1_ctxtdata *uctxt);
 255int hfi1_user_sdma_process_request(struct hfi1_filedata *fd,
 256                                   struct iovec *iovec, unsigned long dim,
 257                                   unsigned long *count);
 258
 259#endif /* _HFI1_USER_SDMA_H */
 260