1 #ifndef _HFI1_USER_SDMA_H 2 #define _HFI1_USER_SDMA_H 3 /* 4 * Copyright(c) 2015 - 2018 Intel Corporation. 5 * 6 * This file is provided under a dual BSD/GPLv2 license. When using or 7 * redistributing this file, you may do so under either license. 8 * 9 * GPL LICENSE SUMMARY 10 * 11 * This program is free software; you can redistribute it and/or modify 12 * it under the terms of version 2 of the GNU General Public License as 13 * published by the Free Software Foundation. 14 * 15 * This program is distributed in the hope that it will be useful, but 16 * WITHOUT ANY WARRANTY; without even the implied warranty of 17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 18 * General Public License for more details. 19 * 20 * BSD LICENSE 21 * 22 * Redistribution and use in source and binary forms, with or without 23 * modification, are permitted provided that the following conditions 24 * are met: 25 * 26 * - Redistributions of source code must retain the above copyright 27 * notice, this list of conditions and the following disclaimer. 28 * - Redistributions in binary form must reproduce the above copyright 29 * notice, this list of conditions and the following disclaimer in 30 * the documentation and/or other materials provided with the 31 * distribution. 32 * - Neither the name of Intel Corporation nor the names of its 33 * contributors may be used to endorse or promote products derived 34 * from this software without specific prior written permission. 35 * 36 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 37 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 38 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 39 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 40 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 41 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 42 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 43 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 44 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 45 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 46 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 47 * 48 */ 49 #include <linux/device.h> 50 #include <linux/wait.h> 51 52 #include "common.h" 53 #include "iowait.h" 54 #include "user_exp_rcv.h" 55 56 /* The maximum number of Data io vectors per message/request */ 57 #define MAX_VECTORS_PER_REQ 8 58 /* 59 * Maximum number of packet to send from each message/request 60 * before moving to the next one. 61 */ 62 #define MAX_PKTS_PER_QUEUE 16 63 64 #define num_pages(x) (1 + ((((x) - 1) & PAGE_MASK) >> PAGE_SHIFT)) 65 66 #define req_opcode(x) \ 67 (((x) >> HFI1_SDMA_REQ_OPCODE_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK) 68 #define req_version(x) \ 69 (((x) >> HFI1_SDMA_REQ_VERSION_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK) 70 #define req_iovcnt(x) \ 71 (((x) >> HFI1_SDMA_REQ_IOVCNT_SHIFT) & HFI1_SDMA_REQ_IOVCNT_MASK) 72 73 /* Number of BTH.PSN bits used for sequence number in expected rcvs */ 74 #define BTH_SEQ_MASK 0x7ffull 75 76 #define AHG_KDETH_INTR_SHIFT 12 77 #define AHG_KDETH_SH_SHIFT 13 78 #define AHG_KDETH_ARRAY_SIZE 9 79 80 #define PBC2LRH(x) ((((x) & 0xfff) << 2) - 4) 81 #define LRH2PBC(x) ((((x) >> 2) + 1) & 0xfff) 82 83 /** 84 * Build an SDMA AHG header update descriptor and save it to an array. 85 * @arr - Array to save the descriptor to. 86 * @idx - Index of the array at which the descriptor will be saved. 87 * @array_size - Size of the array arr. 88 * @dw - Update index into the header in DWs. 89 * @bit - Start bit. 90 * @width - Field width. 91 * @value - 16 bits of immediate data to write into the field. 92 * Returns -ERANGE if idx is invalid. If successful, returns the next index 93 * (idx + 1) of the array to be used for the next descriptor. 94 */ 95 static inline int ahg_header_set(u32 *arr, int idx, size_t array_size, 96 u8 dw, u8 bit, u8 width, u16 value) 97 { 98 if ((size_t)idx >= array_size) 99 return -ERANGE; 100 arr[idx++] = sdma_build_ahg_descriptor(value, dw, bit, width); 101 return idx; 102 } 103 104 /* Tx request flag bits */ 105 #define TXREQ_FLAGS_REQ_ACK BIT(0) /* Set the ACK bit in the header */ 106 #define TXREQ_FLAGS_REQ_DISABLE_SH BIT(1) /* Disable header suppression */ 107 108 #define SDMA_PKT_Q_INACTIVE BIT(0) 109 #define SDMA_PKT_Q_ACTIVE BIT(1) 110 #define SDMA_PKT_Q_DEFERRED BIT(2) 111 112 /* 113 * Maximum retry attempts to submit a TX request 114 * before putting the process to sleep. 115 */ 116 #define MAX_DEFER_RETRY_COUNT 1 117 118 #define SDMA_IOWAIT_TIMEOUT 1000 /* in milliseconds */ 119 120 #define SDMA_DBG(req, fmt, ...) \ 121 hfi1_cdbg(SDMA, "[%u:%u:%u:%u] " fmt, (req)->pq->dd->unit, \ 122 (req)->pq->ctxt, (req)->pq->subctxt, (req)->info.comp_idx, \ 123 ##__VA_ARGS__) 124 125 struct hfi1_user_sdma_pkt_q { 126 u16 ctxt; 127 u16 subctxt; 128 u16 n_max_reqs; 129 atomic_t n_reqs; 130 u16 reqidx; 131 struct hfi1_devdata *dd; 132 struct kmem_cache *txreq_cache; 133 struct user_sdma_request *reqs; 134 unsigned long *req_in_use; 135 struct iowait busy; 136 unsigned state; 137 wait_queue_head_t wait; 138 unsigned long unpinned; 139 struct mmu_rb_handler *handler; 140 atomic_t n_locked; 141 struct mm_struct *mm; 142 }; 143 144 struct hfi1_user_sdma_comp_q { 145 u16 nentries; 146 struct hfi1_sdma_comp_entry *comps; 147 }; 148 149 struct sdma_mmu_node { 150 struct mmu_rb_node rb; 151 struct hfi1_user_sdma_pkt_q *pq; 152 atomic_t refcount; 153 struct page **pages; 154 unsigned int npages; 155 }; 156 157 struct user_sdma_iovec { 158 struct list_head list; 159 struct iovec iov; 160 /* number of pages in this vector */ 161 unsigned int npages; 162 /* array of pinned pages for this vector */ 163 struct page **pages; 164 /* 165 * offset into the virtual address space of the vector at 166 * which we last left off. 167 */ 168 u64 offset; 169 struct sdma_mmu_node *node; 170 }; 171 172 /* evict operation argument */ 173 struct evict_data { 174 u32 cleared; /* count evicted so far */ 175 u32 target; /* target count to evict */ 176 }; 177 178 struct user_sdma_request { 179 /* This is the original header from user space */ 180 struct hfi1_pkt_header hdr; 181 182 /* Read mostly fields */ 183 struct hfi1_user_sdma_pkt_q *pq ____cacheline_aligned_in_smp; 184 struct hfi1_user_sdma_comp_q *cq; 185 /* 186 * Pointer to the SDMA engine for this request. 187 * Since different request could be on different VLs, 188 * each request will need it's own engine pointer. 189 */ 190 struct sdma_engine *sde; 191 struct sdma_req_info info; 192 /* TID array values copied from the tid_iov vector */ 193 u32 *tids; 194 /* total length of the data in the request */ 195 u32 data_len; 196 /* number of elements copied to the tids array */ 197 u16 n_tids; 198 /* 199 * We copy the iovs for this request (based on 200 * info.iovcnt). These are only the data vectors 201 */ 202 u8 data_iovs; 203 s8 ahg_idx; 204 205 /* Writeable fields shared with interrupt */ 206 u64 seqcomp ____cacheline_aligned_in_smp; 207 u64 seqsubmitted; 208 /* status of the last txreq completed */ 209 int status; 210 211 /* Send side fields */ 212 struct list_head txps ____cacheline_aligned_in_smp; 213 u64 seqnum; 214 /* 215 * KDETH.OFFSET (TID) field 216 * The offset can cover multiple packets, depending on the 217 * size of the TID entry. 218 */ 219 u32 tidoffset; 220 /* 221 * KDETH.Offset (Eager) field 222 * We need to remember the initial value so the headers 223 * can be updated properly. 224 */ 225 u32 koffset; 226 u32 sent; 227 /* TID index copied from the tid_iov vector */ 228 u16 tididx; 229 /* progress index moving along the iovs array */ 230 u8 iov_idx; 231 u8 done; 232 u8 has_error; 233 234 struct user_sdma_iovec iovs[MAX_VECTORS_PER_REQ]; 235 } ____cacheline_aligned_in_smp; 236 237 /* 238 * A single txreq could span up to 3 physical pages when the MTU 239 * is sufficiently large (> 4K). Each of the IOV pointers also 240 * needs it's own set of flags so the vector has been handled 241 * independently of each other. 242 */ 243 struct user_sdma_txreq { 244 /* Packet header for the txreq */ 245 struct hfi1_pkt_header hdr; 246 struct sdma_txreq txreq; 247 struct list_head list; 248 struct user_sdma_request *req; 249 u16 flags; 250 unsigned int busycount; 251 u64 seqnum; 252 }; 253 254 int hfi1_user_sdma_alloc_queues(struct hfi1_ctxtdata *uctxt, 255 struct hfi1_filedata *fd); 256 int hfi1_user_sdma_free_queues(struct hfi1_filedata *fd, 257 struct hfi1_ctxtdata *uctxt); 258 int hfi1_user_sdma_process_request(struct hfi1_filedata *fd, 259 struct iovec *iovec, unsigned long dim, 260 unsigned long *count); 261 262 #endif /* _HFI1_USER_SDMA_H */ 263