mem.c revision 297124
1256694Snp/* 2256694Snp * Copyright (c) 2009-2013 Chelsio, Inc. All rights reserved. 3256694Snp * 4256694Snp * This software is available to you under a choice of one of two 5256694Snp * licenses. You may choose to be licensed under the terms of the GNU 6256694Snp * General Public License (GPL) Version 2, available from the file 7256694Snp * COPYING in the main directory of this source tree, or the 8256694Snp * OpenIB.org BSD license below: 9256694Snp * 10256694Snp * Redistribution and use in source and binary forms, with or 11256694Snp * without modification, are permitted provided that the following 12256694Snp * conditions are met: 13256694Snp * 14256694Snp * - Redistributions of source code must retain the above 15256694Snp * copyright notice, this list of conditions and the following 16256694Snp * disclaimer. 17256694Snp * 18256694Snp * - Redistributions in binary form must reproduce the above 19256694Snp * copyright notice, this list of conditions and the following 20256694Snp * disclaimer in the documentation and/or other materials 21256694Snp * provided with the distribution. 22256694Snp * 23256694Snp * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24256694Snp * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25256694Snp * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26256694Snp * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27256694Snp * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28256694Snp * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29256694Snp * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30256694Snp * SOFTWARE. 31256694Snp */ 32256694Snp#include <sys/cdefs.h> 33256694Snp__FBSDID("$FreeBSD: head/sys/dev/cxgbe/iw_cxgbe/mem.c 297124 2016-03-21 00:29:45Z np $"); 34256694Snp 35256694Snp#include "opt_inet.h" 36256694Snp 37256694Snp#ifdef TCP_OFFLOAD 38256694Snp#include <linux/types.h> 39256694Snp#include <linux/kref.h> 40256694Snp#include <rdma/ib_umem.h> 41256694Snp#include <asm/atomic.h> 42256694Snp 43256694Snp#include <common/t4_msg.h> 44256694Snp#include "iw_cxgbe.h" 45256694Snp 46256694Snp#define T4_ULPTX_MIN_IO 32 47256694Snp#define C4IW_MAX_INLINE_SIZE 96 48256694Snp 49297124Snpstatic int mr_exceeds_hw_limits(struct c4iw_dev *dev, u64 length) 50297124Snp{ 51297124Snp return (is_t4(dev->rdev.adap) || 52297124Snp is_t5(dev->rdev.adap)) && 53297124Snp length >= 8*1024*1024*1024ULL; 54297124Snp} 55256694Snpstatic int 56256694Snpwrite_adapter_mem(struct c4iw_rdev *rdev, u32 addr, u32 len, void *data) 57256694Snp{ 58256694Snp struct adapter *sc = rdev->adap; 59256694Snp struct ulp_mem_io *ulpmc; 60256694Snp struct ulptx_idata *ulpsc; 61256694Snp u8 wr_len, *to_dp, *from_dp; 62256694Snp int copy_len, num_wqe, i, ret = 0; 63256694Snp struct c4iw_wr_wait wr_wait; 64256694Snp struct wrqe *wr; 65256694Snp u32 cmd; 66256694Snp 67256694Snp cmd = cpu_to_be32(V_ULPTX_CMD(ULP_TX_MEM_WRITE)); 68256694Snp if (is_t4(sc)) 69256694Snp cmd |= cpu_to_be32(F_ULP_MEMIO_ORDER); 70256694Snp else 71256694Snp cmd |= cpu_to_be32(F_T5_ULP_MEMIO_IMM); 72256694Snp 73256694Snp addr &= 0x7FFFFFF; 74256694Snp CTR3(KTR_IW_CXGBE, "%s addr 0x%x len %u", __func__, addr, len); 75256694Snp num_wqe = DIV_ROUND_UP(len, C4IW_MAX_INLINE_SIZE); 76256694Snp c4iw_init_wr_wait(&wr_wait); 77256694Snp for (i = 0; i < num_wqe; i++) { 78256694Snp 79256694Snp copy_len = min(len, C4IW_MAX_INLINE_SIZE); 80256694Snp wr_len = roundup(sizeof *ulpmc + sizeof *ulpsc + 81256694Snp roundup(copy_len, T4_ULPTX_MIN_IO), 16); 82256694Snp 83256694Snp wr = alloc_wrqe(wr_len, &sc->sge.mgmtq); 84256694Snp if (wr == NULL) 85256694Snp return (0); 86256694Snp ulpmc = wrtod(wr); 87256694Snp 88256694Snp memset(ulpmc, 0, wr_len); 89256694Snp INIT_ULPTX_WR(ulpmc, wr_len, 0, 0); 90256694Snp 91256694Snp if (i == (num_wqe-1)) { 92256694Snp ulpmc->wr.wr_hi = cpu_to_be32(V_FW_WR_OP(FW_ULPTX_WR) | 93256694Snp F_FW_WR_COMPL); 94256694Snp ulpmc->wr.wr_lo = (__force __be64)(unsigned long) &wr_wait; 95256694Snp } else 96256694Snp ulpmc->wr.wr_hi = cpu_to_be32(V_FW_WR_OP(FW_ULPTX_WR)); 97256694Snp ulpmc->wr.wr_mid = cpu_to_be32( 98256694Snp V_FW_WR_LEN16(DIV_ROUND_UP(wr_len, 16))); 99256694Snp 100256694Snp ulpmc->cmd = cmd; 101256694Snp ulpmc->dlen = cpu_to_be32(V_ULP_MEMIO_DATA_LEN( 102256694Snp DIV_ROUND_UP(copy_len, T4_ULPTX_MIN_IO))); 103256694Snp ulpmc->len16 = cpu_to_be32(DIV_ROUND_UP(wr_len-sizeof(ulpmc->wr), 104256694Snp 16)); 105256694Snp ulpmc->lock_addr = cpu_to_be32(V_ULP_MEMIO_ADDR(addr + i * 3)); 106256694Snp 107256694Snp ulpsc = (struct ulptx_idata *)(ulpmc + 1); 108256694Snp ulpsc->cmd_more = cpu_to_be32(V_ULPTX_CMD(ULP_TX_SC_IMM)); 109256694Snp ulpsc->len = cpu_to_be32(roundup(copy_len, T4_ULPTX_MIN_IO)); 110256694Snp 111256694Snp to_dp = (u8 *)(ulpsc + 1); 112256694Snp from_dp = (u8 *)data + i * C4IW_MAX_INLINE_SIZE; 113256694Snp if (data) 114256694Snp memcpy(to_dp, from_dp, copy_len); 115256694Snp else 116256694Snp memset(to_dp, 0, copy_len); 117256694Snp if (copy_len % T4_ULPTX_MIN_IO) 118256694Snp memset(to_dp + copy_len, 0, T4_ULPTX_MIN_IO - 119256694Snp (copy_len % T4_ULPTX_MIN_IO)); 120256694Snp t4_wrq_tx(sc, wr); 121256694Snp len -= C4IW_MAX_INLINE_SIZE; 122256694Snp } 123256694Snp 124256694Snp ret = c4iw_wait_for_reply(rdev, &wr_wait, 0, 0, __func__); 125256694Snp return ret; 126256694Snp} 127256694Snp 128256694Snp/* 129256694Snp * Build and write a TPT entry. 130256694Snp * IN: stag key, pdid, perm, bind_enabled, zbva, to, len, page_size, 131256694Snp * pbl_size and pbl_addr 132256694Snp * OUT: stag index 133256694Snp */ 134256694Snpstatic int write_tpt_entry(struct c4iw_rdev *rdev, u32 reset_tpt_entry, 135256694Snp u32 *stag, u8 stag_state, u32 pdid, 136256694Snp enum fw_ri_stag_type type, enum fw_ri_mem_perms perm, 137256694Snp int bind_enabled, u32 zbva, u64 to, 138256694Snp u64 len, u8 page_size, u32 pbl_size, u32 pbl_addr) 139256694Snp{ 140256694Snp int err; 141256694Snp struct fw_ri_tpte tpt; 142256694Snp u32 stag_idx; 143256694Snp static atomic_t key; 144256694Snp 145256694Snp if (c4iw_fatal_error(rdev)) 146256694Snp return -EIO; 147256694Snp 148256694Snp stag_state = stag_state > 0; 149256694Snp stag_idx = (*stag) >> 8; 150256694Snp 151256694Snp if ((!reset_tpt_entry) && (*stag == T4_STAG_UNSET)) { 152256694Snp stag_idx = c4iw_get_resource(&rdev->resource.tpt_table); 153297124Snp if (!stag_idx) { 154297124Snp mutex_lock(&rdev->stats.lock); 155297124Snp rdev->stats.stag.fail++; 156297124Snp mutex_unlock(&rdev->stats.lock); 157256694Snp return -ENOMEM; 158297124Snp } 159256694Snp mutex_lock(&rdev->stats.lock); 160256694Snp rdev->stats.stag.cur += 32; 161256694Snp if (rdev->stats.stag.cur > rdev->stats.stag.max) 162256694Snp rdev->stats.stag.max = rdev->stats.stag.cur; 163256694Snp mutex_unlock(&rdev->stats.lock); 164256694Snp *stag = (stag_idx << 8) | (atomic_inc_return(&key) & 0xff); 165256694Snp } 166256694Snp CTR5(KTR_IW_CXGBE, 167256694Snp "%s stag_state 0x%0x type 0x%0x pdid 0x%0x, stag_idx 0x%x", 168256694Snp __func__, stag_state, type, pdid, stag_idx); 169256694Snp 170256694Snp /* write TPT entry */ 171256694Snp if (reset_tpt_entry) 172256694Snp memset(&tpt, 0, sizeof(tpt)); 173256694Snp else { 174256694Snp tpt.valid_to_pdid = cpu_to_be32(F_FW_RI_TPTE_VALID | 175256694Snp V_FW_RI_TPTE_STAGKEY((*stag & M_FW_RI_TPTE_STAGKEY)) | 176256694Snp V_FW_RI_TPTE_STAGSTATE(stag_state) | 177256694Snp V_FW_RI_TPTE_STAGTYPE(type) | V_FW_RI_TPTE_PDID(pdid)); 178256694Snp tpt.locread_to_qpid = cpu_to_be32(V_FW_RI_TPTE_PERM(perm) | 179256694Snp (bind_enabled ? F_FW_RI_TPTE_MWBINDEN : 0) | 180256694Snp V_FW_RI_TPTE_ADDRTYPE((zbva ? FW_RI_ZERO_BASED_TO : 181256694Snp FW_RI_VA_BASED_TO))| 182256694Snp V_FW_RI_TPTE_PS(page_size)); 183256694Snp tpt.nosnoop_pbladdr = !pbl_size ? 0 : cpu_to_be32( 184256694Snp V_FW_RI_TPTE_PBLADDR(PBL_OFF(rdev, pbl_addr)>>3)); 185256694Snp tpt.len_lo = cpu_to_be32((u32)(len & 0xffffffffUL)); 186256694Snp tpt.va_hi = cpu_to_be32((u32)(to >> 32)); 187256694Snp tpt.va_lo_fbo = cpu_to_be32((u32)(to & 0xffffffffUL)); 188256694Snp tpt.dca_mwbcnt_pstag = cpu_to_be32(0); 189256694Snp tpt.len_hi = cpu_to_be32((u32)(len >> 32)); 190256694Snp } 191256694Snp err = write_adapter_mem(rdev, stag_idx + 192256694Snp (rdev->adap->vres.stag.start >> 5), 193256694Snp sizeof(tpt), &tpt); 194256694Snp 195256694Snp if (reset_tpt_entry) { 196256694Snp c4iw_put_resource(&rdev->resource.tpt_table, stag_idx); 197256694Snp mutex_lock(&rdev->stats.lock); 198256694Snp rdev->stats.stag.cur -= 32; 199256694Snp mutex_unlock(&rdev->stats.lock); 200256694Snp } 201256694Snp return err; 202256694Snp} 203256694Snp 204256694Snpstatic int write_pbl(struct c4iw_rdev *rdev, __be64 *pbl, 205256694Snp u32 pbl_addr, u32 pbl_size) 206256694Snp{ 207256694Snp int err; 208256694Snp 209256694Snp CTR4(KTR_IW_CXGBE, "%s *pdb_addr 0x%x, pbl_base 0x%x, pbl_size %d", 210256694Snp __func__, pbl_addr, rdev->adap->vres.pbl.start, pbl_size); 211256694Snp 212256694Snp err = write_adapter_mem(rdev, pbl_addr >> 5, pbl_size << 3, pbl); 213256694Snp return err; 214256694Snp} 215256694Snp 216256694Snpstatic int dereg_mem(struct c4iw_rdev *rdev, u32 stag, u32 pbl_size, 217256694Snp u32 pbl_addr) 218256694Snp{ 219256694Snp return write_tpt_entry(rdev, 1, &stag, 0, 0, 0, 0, 0, 0, 0UL, 0, 0, 220256694Snp pbl_size, pbl_addr); 221256694Snp} 222256694Snp 223256694Snpstatic int allocate_window(struct c4iw_rdev *rdev, u32 * stag, u32 pdid) 224256694Snp{ 225256694Snp *stag = T4_STAG_UNSET; 226256694Snp return write_tpt_entry(rdev, 0, stag, 0, pdid, FW_RI_STAG_MW, 0, 0, 0, 227256694Snp 0UL, 0, 0, 0, 0); 228256694Snp} 229256694Snp 230256694Snpstatic int deallocate_window(struct c4iw_rdev *rdev, u32 stag) 231256694Snp{ 232256694Snp return write_tpt_entry(rdev, 1, &stag, 0, 0, 0, 0, 0, 0, 0UL, 0, 0, 0, 233256694Snp 0); 234256694Snp} 235256694Snp 236256694Snpstatic int allocate_stag(struct c4iw_rdev *rdev, u32 *stag, u32 pdid, 237256694Snp u32 pbl_size, u32 pbl_addr) 238256694Snp{ 239256694Snp *stag = T4_STAG_UNSET; 240256694Snp return write_tpt_entry(rdev, 0, stag, 0, pdid, FW_RI_STAG_NSMR, 0, 0, 0, 241256694Snp 0UL, 0, 0, pbl_size, pbl_addr); 242256694Snp} 243256694Snp 244256694Snpstatic int finish_mem_reg(struct c4iw_mr *mhp, u32 stag) 245256694Snp{ 246256694Snp u32 mmid; 247256694Snp 248256694Snp mhp->attr.state = 1; 249256694Snp mhp->attr.stag = stag; 250256694Snp mmid = stag >> 8; 251256694Snp mhp->ibmr.rkey = mhp->ibmr.lkey = stag; 252256694Snp CTR3(KTR_IW_CXGBE, "%s mmid 0x%x mhp %p", __func__, mmid, mhp); 253256694Snp return insert_handle(mhp->rhp, &mhp->rhp->mmidr, mhp, mmid); 254256694Snp} 255256694Snp 256256694Snpstatic int register_mem(struct c4iw_dev *rhp, struct c4iw_pd *php, 257256694Snp struct c4iw_mr *mhp, int shift) 258256694Snp{ 259256694Snp u32 stag = T4_STAG_UNSET; 260256694Snp int ret; 261256694Snp 262256694Snp ret = write_tpt_entry(&rhp->rdev, 0, &stag, 1, mhp->attr.pdid, 263297124Snp FW_RI_STAG_NSMR, mhp->attr.len ? mhp->attr.perms : 0, 264256694Snp mhp->attr.mw_bind_enable, mhp->attr.zbva, 265297124Snp mhp->attr.va_fbo, mhp->attr.len ? mhp->attr.len : -1, shift - 12, 266256694Snp mhp->attr.pbl_size, mhp->attr.pbl_addr); 267256694Snp if (ret) 268256694Snp return ret; 269256694Snp 270256694Snp ret = finish_mem_reg(mhp, stag); 271256694Snp if (ret) 272256694Snp dereg_mem(&rhp->rdev, mhp->attr.stag, mhp->attr.pbl_size, 273256694Snp mhp->attr.pbl_addr); 274256694Snp return ret; 275256694Snp} 276256694Snp 277256694Snpstatic int reregister_mem(struct c4iw_dev *rhp, struct c4iw_pd *php, 278256694Snp struct c4iw_mr *mhp, int shift, int npages) 279256694Snp{ 280256694Snp u32 stag; 281256694Snp int ret; 282256694Snp 283256694Snp if (npages > mhp->attr.pbl_size) 284256694Snp return -ENOMEM; 285256694Snp 286256694Snp stag = mhp->attr.stag; 287256694Snp ret = write_tpt_entry(&rhp->rdev, 0, &stag, 1, mhp->attr.pdid, 288256694Snp FW_RI_STAG_NSMR, mhp->attr.perms, 289256694Snp mhp->attr.mw_bind_enable, mhp->attr.zbva, 290256694Snp mhp->attr.va_fbo, mhp->attr.len, shift - 12, 291256694Snp mhp->attr.pbl_size, mhp->attr.pbl_addr); 292256694Snp if (ret) 293256694Snp return ret; 294256694Snp 295256694Snp ret = finish_mem_reg(mhp, stag); 296256694Snp if (ret) 297256694Snp dereg_mem(&rhp->rdev, mhp->attr.stag, mhp->attr.pbl_size, 298256694Snp mhp->attr.pbl_addr); 299256694Snp 300256694Snp return ret; 301256694Snp} 302256694Snp 303256694Snpstatic int alloc_pbl(struct c4iw_mr *mhp, int npages) 304256694Snp{ 305256694Snp mhp->attr.pbl_addr = c4iw_pblpool_alloc(&mhp->rhp->rdev, 306256694Snp npages << 3); 307256694Snp 308256694Snp if (!mhp->attr.pbl_addr) 309256694Snp return -ENOMEM; 310256694Snp 311256694Snp mhp->attr.pbl_size = npages; 312256694Snp 313256694Snp return 0; 314256694Snp} 315256694Snp 316256694Snpstatic int build_phys_page_list(struct ib_phys_buf *buffer_list, 317256694Snp int num_phys_buf, u64 *iova_start, 318256694Snp u64 *total_size, int *npages, 319256694Snp int *shift, __be64 **page_list) 320256694Snp{ 321256694Snp u64 mask; 322256694Snp int i, j, n; 323256694Snp 324256694Snp mask = 0; 325256694Snp *total_size = 0; 326256694Snp for (i = 0; i < num_phys_buf; ++i) { 327256694Snp if (i != 0 && buffer_list[i].addr & ~PAGE_MASK) 328256694Snp return -EINVAL; 329256694Snp if (i != 0 && i != num_phys_buf - 1 && 330256694Snp (buffer_list[i].size & ~PAGE_MASK)) 331256694Snp return -EINVAL; 332256694Snp *total_size += buffer_list[i].size; 333256694Snp if (i > 0) 334256694Snp mask |= buffer_list[i].addr; 335256694Snp else 336256694Snp mask |= buffer_list[i].addr & PAGE_MASK; 337256694Snp if (i != num_phys_buf - 1) 338256694Snp mask |= buffer_list[i].addr + buffer_list[i].size; 339256694Snp else 340256694Snp mask |= (buffer_list[i].addr + buffer_list[i].size + 341256694Snp PAGE_SIZE - 1) & PAGE_MASK; 342256694Snp } 343256694Snp 344256694Snp if (*total_size > 0xFFFFFFFFULL) 345256694Snp return -ENOMEM; 346256694Snp 347256694Snp /* Find largest page shift we can use to cover buffers */ 348256694Snp for (*shift = PAGE_SHIFT; *shift < 27; ++(*shift)) 349256694Snp if ((1ULL << *shift) & mask) 350256694Snp break; 351256694Snp 352256694Snp buffer_list[0].size += buffer_list[0].addr & ((1ULL << *shift) - 1); 353256694Snp buffer_list[0].addr &= ~0ull << *shift; 354256694Snp 355256694Snp *npages = 0; 356256694Snp for (i = 0; i < num_phys_buf; ++i) 357256694Snp *npages += (buffer_list[i].size + 358256694Snp (1ULL << *shift) - 1) >> *shift; 359256694Snp 360256694Snp if (!*npages) 361256694Snp return -EINVAL; 362256694Snp 363256694Snp *page_list = kmalloc(sizeof(u64) * *npages, GFP_KERNEL); 364256694Snp if (!*page_list) 365256694Snp return -ENOMEM; 366256694Snp 367256694Snp n = 0; 368256694Snp for (i = 0; i < num_phys_buf; ++i) 369256694Snp for (j = 0; 370256694Snp j < (buffer_list[i].size + (1ULL << *shift) - 1) >> *shift; 371256694Snp ++j) 372256694Snp (*page_list)[n++] = cpu_to_be64(buffer_list[i].addr + 373256694Snp ((u64) j << *shift)); 374256694Snp 375256694Snp CTR6(KTR_IW_CXGBE, 376256694Snp "%s va 0x%llx mask 0x%llx shift %d len %lld pbl_size %d", __func__, 377256694Snp (unsigned long long)*iova_start, (unsigned long long)mask, *shift, 378256694Snp (unsigned long long)*total_size, *npages); 379256694Snp 380256694Snp return 0; 381256694Snp 382256694Snp} 383256694Snp 384256694Snpint c4iw_reregister_phys_mem(struct ib_mr *mr, int mr_rereg_mask, 385256694Snp struct ib_pd *pd, struct ib_phys_buf *buffer_list, 386256694Snp int num_phys_buf, int acc, u64 *iova_start) 387256694Snp{ 388256694Snp 389256694Snp struct c4iw_mr mh, *mhp; 390256694Snp struct c4iw_pd *php; 391256694Snp struct c4iw_dev *rhp; 392256694Snp __be64 *page_list = NULL; 393256694Snp int shift = 0; 394297124Snp u64 total_size = 0; 395256694Snp int npages = 0; 396256694Snp int ret; 397256694Snp 398256694Snp CTR3(KTR_IW_CXGBE, "%s ib_mr %p ib_pd %p", __func__, mr, pd); 399256694Snp 400256694Snp /* There can be no memory windows */ 401256694Snp if (atomic_read(&mr->usecnt)) 402256694Snp return -EINVAL; 403256694Snp 404256694Snp mhp = to_c4iw_mr(mr); 405256694Snp rhp = mhp->rhp; 406256694Snp php = to_c4iw_pd(mr->pd); 407256694Snp 408256694Snp /* make sure we are on the same adapter */ 409256694Snp if (rhp != php->rhp) 410256694Snp return -EINVAL; 411256694Snp 412256694Snp memcpy(&mh, mhp, sizeof *mhp); 413256694Snp 414256694Snp if (mr_rereg_mask & IB_MR_REREG_PD) 415256694Snp php = to_c4iw_pd(pd); 416256694Snp if (mr_rereg_mask & IB_MR_REREG_ACCESS) { 417256694Snp mh.attr.perms = c4iw_ib_to_tpt_access(acc); 418256694Snp mh.attr.mw_bind_enable = (acc & IB_ACCESS_MW_BIND) == 419256694Snp IB_ACCESS_MW_BIND; 420256694Snp } 421256694Snp if (mr_rereg_mask & IB_MR_REREG_TRANS) { 422256694Snp ret = build_phys_page_list(buffer_list, num_phys_buf, 423256694Snp iova_start, 424256694Snp &total_size, &npages, 425256694Snp &shift, &page_list); 426256694Snp if (ret) 427256694Snp return ret; 428256694Snp } 429297124Snp if (mr_exceeds_hw_limits(rhp, total_size)) { 430297124Snp kfree(page_list); 431297124Snp return -EINVAL; 432297124Snp } 433256694Snp ret = reregister_mem(rhp, php, &mh, shift, npages); 434256694Snp kfree(page_list); 435256694Snp if (ret) 436256694Snp return ret; 437256694Snp if (mr_rereg_mask & IB_MR_REREG_PD) 438256694Snp mhp->attr.pdid = php->pdid; 439256694Snp if (mr_rereg_mask & IB_MR_REREG_ACCESS) 440256694Snp mhp->attr.perms = c4iw_ib_to_tpt_access(acc); 441256694Snp if (mr_rereg_mask & IB_MR_REREG_TRANS) { 442256694Snp mhp->attr.zbva = 0; 443256694Snp mhp->attr.va_fbo = *iova_start; 444256694Snp mhp->attr.page_size = shift - 12; 445256694Snp mhp->attr.len = (u32) total_size; 446256694Snp mhp->attr.pbl_size = npages; 447256694Snp } 448256694Snp 449256694Snp return 0; 450256694Snp} 451256694Snp 452256694Snpstruct ib_mr *c4iw_register_phys_mem(struct ib_pd *pd, 453256694Snp struct ib_phys_buf *buffer_list, 454256694Snp int num_phys_buf, int acc, u64 *iova_start) 455256694Snp{ 456256694Snp __be64 *page_list; 457256694Snp int shift; 458256694Snp u64 total_size; 459256694Snp int npages; 460256694Snp struct c4iw_dev *rhp; 461256694Snp struct c4iw_pd *php; 462256694Snp struct c4iw_mr *mhp; 463256694Snp int ret; 464256694Snp 465256694Snp CTR2(KTR_IW_CXGBE, "%s ib_pd %p", __func__, pd); 466256694Snp php = to_c4iw_pd(pd); 467256694Snp rhp = php->rhp; 468256694Snp 469256694Snp mhp = kzalloc(sizeof(*mhp), GFP_KERNEL); 470256694Snp if (!mhp) 471256694Snp return ERR_PTR(-ENOMEM); 472256694Snp 473256694Snp mhp->rhp = rhp; 474256694Snp 475256694Snp /* First check that we have enough alignment */ 476256694Snp if ((*iova_start & ~PAGE_MASK) != (buffer_list[0].addr & ~PAGE_MASK)) { 477256694Snp ret = -EINVAL; 478256694Snp goto err; 479256694Snp } 480256694Snp 481256694Snp if (num_phys_buf > 1 && 482256694Snp ((buffer_list[0].addr + buffer_list[0].size) & ~PAGE_MASK)) { 483256694Snp ret = -EINVAL; 484256694Snp goto err; 485256694Snp } 486256694Snp 487256694Snp ret = build_phys_page_list(buffer_list, num_phys_buf, iova_start, 488256694Snp &total_size, &npages, &shift, 489256694Snp &page_list); 490256694Snp if (ret) 491256694Snp goto err; 492256694Snp 493297124Snp if (mr_exceeds_hw_limits(rhp, total_size)) { 494297124Snp kfree(page_list); 495297124Snp ret = -EINVAL; 496297124Snp goto err; 497297124Snp } 498256694Snp ret = alloc_pbl(mhp, npages); 499256694Snp if (ret) { 500256694Snp kfree(page_list); 501297124Snp goto err; 502256694Snp } 503256694Snp 504256694Snp ret = write_pbl(&mhp->rhp->rdev, page_list, mhp->attr.pbl_addr, 505256694Snp npages); 506256694Snp kfree(page_list); 507256694Snp if (ret) 508256694Snp goto err_pbl; 509256694Snp 510256694Snp mhp->attr.pdid = php->pdid; 511256694Snp mhp->attr.zbva = 0; 512256694Snp 513256694Snp mhp->attr.perms = c4iw_ib_to_tpt_access(acc); 514256694Snp mhp->attr.va_fbo = *iova_start; 515256694Snp mhp->attr.page_size = shift - 12; 516256694Snp 517256694Snp mhp->attr.len = (u32) total_size; 518256694Snp mhp->attr.pbl_size = npages; 519256694Snp ret = register_mem(rhp, php, mhp, shift); 520256694Snp if (ret) 521256694Snp goto err_pbl; 522256694Snp 523256694Snp return &mhp->ibmr; 524256694Snp 525256694Snperr_pbl: 526256694Snp c4iw_pblpool_free(&mhp->rhp->rdev, mhp->attr.pbl_addr, 527256694Snp mhp->attr.pbl_size << 3); 528256694Snp 529256694Snperr: 530256694Snp kfree(mhp); 531256694Snp return ERR_PTR(ret); 532256694Snp 533256694Snp} 534256694Snp 535256694Snpstruct ib_mr *c4iw_get_dma_mr(struct ib_pd *pd, int acc) 536256694Snp{ 537256694Snp struct c4iw_dev *rhp; 538256694Snp struct c4iw_pd *php; 539256694Snp struct c4iw_mr *mhp; 540256694Snp int ret; 541256694Snp u32 stag = T4_STAG_UNSET; 542256694Snp 543256694Snp CTR2(KTR_IW_CXGBE, "%s ib_pd %p", __func__, pd); 544256694Snp php = to_c4iw_pd(pd); 545256694Snp rhp = php->rhp; 546256694Snp 547256694Snp mhp = kzalloc(sizeof(*mhp), GFP_KERNEL); 548256694Snp if (!mhp) 549256694Snp return ERR_PTR(-ENOMEM); 550256694Snp 551256694Snp mhp->rhp = rhp; 552256694Snp mhp->attr.pdid = php->pdid; 553256694Snp mhp->attr.perms = c4iw_ib_to_tpt_access(acc); 554256694Snp mhp->attr.mw_bind_enable = (acc&IB_ACCESS_MW_BIND) == IB_ACCESS_MW_BIND; 555256694Snp mhp->attr.zbva = 0; 556256694Snp mhp->attr.va_fbo = 0; 557256694Snp mhp->attr.page_size = 0; 558256694Snp mhp->attr.len = ~0UL; 559256694Snp mhp->attr.pbl_size = 0; 560256694Snp 561256694Snp ret = write_tpt_entry(&rhp->rdev, 0, &stag, 1, php->pdid, 562256694Snp FW_RI_STAG_NSMR, mhp->attr.perms, 563256694Snp mhp->attr.mw_bind_enable, 0, 0, ~0UL, 0, 0, 0); 564256694Snp if (ret) 565256694Snp goto err1; 566256694Snp 567256694Snp ret = finish_mem_reg(mhp, stag); 568256694Snp if (ret) 569256694Snp goto err2; 570256694Snp return &mhp->ibmr; 571256694Snperr2: 572256694Snp dereg_mem(&rhp->rdev, mhp->attr.stag, mhp->attr.pbl_size, 573256694Snp mhp->attr.pbl_addr); 574256694Snperr1: 575256694Snp kfree(mhp); 576256694Snp return ERR_PTR(ret); 577256694Snp} 578256694Snp 579256694Snpstruct ib_mr *c4iw_reg_user_mr(struct ib_pd *pd, u64 start, u64 length, 580256694Snp u64 virt, int acc, struct ib_udata *udata, int mr_id) 581256694Snp{ 582256694Snp __be64 *pages; 583256694Snp int shift, n, len; 584278886Shselasky int i, k, entry; 585256694Snp int err = 0; 586278886Shselasky struct scatterlist *sg; 587256694Snp struct c4iw_dev *rhp; 588256694Snp struct c4iw_pd *php; 589256694Snp struct c4iw_mr *mhp; 590256694Snp 591256694Snp CTR2(KTR_IW_CXGBE, "%s ib_pd %p", __func__, pd); 592256694Snp 593256694Snp if (length == ~0ULL) 594256694Snp return ERR_PTR(-EINVAL); 595256694Snp 596256694Snp if ((length + start) < start) 597256694Snp return ERR_PTR(-EINVAL); 598256694Snp 599256694Snp php = to_c4iw_pd(pd); 600256694Snp rhp = php->rhp; 601297124Snp 602297124Snp if (mr_exceeds_hw_limits(rhp, length)) 603297124Snp return ERR_PTR(-EINVAL); 604297124Snp 605256694Snp mhp = kzalloc(sizeof(*mhp), GFP_KERNEL); 606256694Snp if (!mhp) 607256694Snp return ERR_PTR(-ENOMEM); 608256694Snp 609256694Snp mhp->rhp = rhp; 610256694Snp 611256694Snp mhp->umem = ib_umem_get(pd->uobject->context, start, length, acc, 0); 612256694Snp if (IS_ERR(mhp->umem)) { 613256694Snp err = PTR_ERR(mhp->umem); 614256694Snp kfree(mhp); 615256694Snp return ERR_PTR(err); 616256694Snp } 617256694Snp 618256694Snp shift = ffs(mhp->umem->page_size) - 1; 619278886Shselasky 620278886Shselasky n = mhp->umem->nmap; 621256694Snp err = alloc_pbl(mhp, n); 622256694Snp if (err) 623256694Snp goto err; 624256694Snp 625256694Snp pages = (__be64 *) __get_free_page(GFP_KERNEL); 626256694Snp if (!pages) { 627256694Snp err = -ENOMEM; 628256694Snp goto err_pbl; 629256694Snp } 630256694Snp 631256694Snp i = n = 0; 632278886Shselasky for_each_sg(mhp->umem->sg_head.sgl, sg, mhp->umem->nmap, entry) { 633278886Shselasky len = sg_dma_len(sg) >> shift; 634278886Shselasky for (k = 0; k < len; ++k) { 635278886Shselasky pages[i++] = cpu_to_be64(sg_dma_address(sg) + 636278886Shselasky mhp->umem->page_size * k); 637278886Shselasky if (i == PAGE_SIZE / sizeof *pages) { 638278886Shselasky err = write_pbl(&mhp->rhp->rdev, 639278886Shselasky pages, 640278886Shselasky mhp->attr.pbl_addr + (n << 3), i); 641278886Shselasky if (err) 642278886Shselasky goto pbl_done; 643278886Shselasky n += i; 644278886Shselasky i = 0; 645256694Snp 646256694Snp } 647256694Snp } 648278886Shselasky } 649256694Snp 650256694Snp if (i) 651256694Snp err = write_pbl(&mhp->rhp->rdev, pages, 652256694Snp mhp->attr.pbl_addr + (n << 3), i); 653256694Snp 654256694Snppbl_done: 655256694Snp free_page((unsigned long) pages); 656256694Snp if (err) 657256694Snp goto err_pbl; 658256694Snp 659256694Snp mhp->attr.pdid = php->pdid; 660256694Snp mhp->attr.zbva = 0; 661256694Snp mhp->attr.perms = c4iw_ib_to_tpt_access(acc); 662256694Snp mhp->attr.va_fbo = virt; 663256694Snp mhp->attr.page_size = shift - 12; 664256694Snp mhp->attr.len = length; 665256694Snp 666256694Snp err = register_mem(rhp, php, mhp, shift); 667256694Snp if (err) 668256694Snp goto err_pbl; 669256694Snp 670256694Snp return &mhp->ibmr; 671256694Snp 672256694Snperr_pbl: 673256694Snp c4iw_pblpool_free(&mhp->rhp->rdev, mhp->attr.pbl_addr, 674256694Snp mhp->attr.pbl_size << 3); 675256694Snp 676256694Snperr: 677256694Snp ib_umem_release(mhp->umem); 678256694Snp kfree(mhp); 679256694Snp return ERR_PTR(err); 680256694Snp} 681256694Snp 682278886Shselaskystruct ib_mw *c4iw_alloc_mw(struct ib_pd *pd, enum ib_mw_type type) 683256694Snp{ 684256694Snp struct c4iw_dev *rhp; 685256694Snp struct c4iw_pd *php; 686256694Snp struct c4iw_mw *mhp; 687256694Snp u32 mmid; 688256694Snp u32 stag = 0; 689256694Snp int ret; 690256694Snp 691256694Snp php = to_c4iw_pd(pd); 692256694Snp rhp = php->rhp; 693256694Snp mhp = kzalloc(sizeof(*mhp), GFP_KERNEL); 694256694Snp if (!mhp) 695256694Snp return ERR_PTR(-ENOMEM); 696256694Snp ret = allocate_window(&rhp->rdev, &stag, php->pdid); 697256694Snp if (ret) { 698256694Snp kfree(mhp); 699256694Snp return ERR_PTR(ret); 700256694Snp } 701256694Snp mhp->rhp = rhp; 702256694Snp mhp->attr.pdid = php->pdid; 703256694Snp mhp->attr.type = FW_RI_STAG_MW; 704256694Snp mhp->attr.stag = stag; 705256694Snp mmid = (stag) >> 8; 706256694Snp mhp->ibmw.rkey = stag; 707256694Snp if (insert_handle(rhp, &rhp->mmidr, mhp, mmid)) { 708256694Snp deallocate_window(&rhp->rdev, mhp->attr.stag); 709256694Snp kfree(mhp); 710256694Snp return ERR_PTR(-ENOMEM); 711256694Snp } 712256694Snp CTR4(KTR_IW_CXGBE, "%s mmid 0x%x mhp %p stag 0x%x", __func__, mmid, mhp, 713256694Snp stag); 714256694Snp return &(mhp->ibmw); 715256694Snp} 716256694Snp 717256694Snpint c4iw_dealloc_mw(struct ib_mw *mw) 718256694Snp{ 719256694Snp struct c4iw_dev *rhp; 720256694Snp struct c4iw_mw *mhp; 721256694Snp u32 mmid; 722256694Snp 723256694Snp mhp = to_c4iw_mw(mw); 724256694Snp rhp = mhp->rhp; 725256694Snp mmid = (mw->rkey) >> 8; 726256694Snp remove_handle(rhp, &rhp->mmidr, mmid); 727256694Snp deallocate_window(&rhp->rdev, mhp->attr.stag); 728256694Snp kfree(mhp); 729256694Snp CTR4(KTR_IW_CXGBE, "%s ib_mw %p mmid 0x%x ptr %p", __func__, mw, mmid, 730256694Snp mhp); 731256694Snp return 0; 732256694Snp} 733256694Snp 734256694Snpstruct ib_mr *c4iw_alloc_fast_reg_mr(struct ib_pd *pd, int pbl_depth) 735256694Snp{ 736256694Snp struct c4iw_dev *rhp; 737256694Snp struct c4iw_pd *php; 738256694Snp struct c4iw_mr *mhp; 739256694Snp u32 mmid; 740256694Snp u32 stag = 0; 741256694Snp int ret = 0; 742256694Snp 743256694Snp php = to_c4iw_pd(pd); 744256694Snp rhp = php->rhp; 745256694Snp mhp = kzalloc(sizeof(*mhp), GFP_KERNEL); 746256694Snp if (!mhp) { 747256694Snp ret = -ENOMEM; 748256694Snp goto err; 749256694Snp } 750256694Snp 751256694Snp mhp->rhp = rhp; 752256694Snp ret = alloc_pbl(mhp, pbl_depth); 753256694Snp if (ret) 754256694Snp goto err1; 755256694Snp mhp->attr.pbl_size = pbl_depth; 756256694Snp ret = allocate_stag(&rhp->rdev, &stag, php->pdid, 757256694Snp mhp->attr.pbl_size, mhp->attr.pbl_addr); 758256694Snp if (ret) 759256694Snp goto err2; 760256694Snp mhp->attr.pdid = php->pdid; 761256694Snp mhp->attr.type = FW_RI_STAG_NSMR; 762256694Snp mhp->attr.stag = stag; 763256694Snp mhp->attr.state = 1; 764256694Snp mmid = (stag) >> 8; 765256694Snp mhp->ibmr.rkey = mhp->ibmr.lkey = stag; 766256694Snp if (insert_handle(rhp, &rhp->mmidr, mhp, mmid)) { 767256694Snp ret = -ENOMEM; 768256694Snp goto err3; 769256694Snp } 770256694Snp 771256694Snp CTR4(KTR_IW_CXGBE, "%s mmid 0x%x mhp %p stag 0x%x", __func__, mmid, mhp, 772256694Snp stag); 773256694Snp return &(mhp->ibmr); 774256694Snperr3: 775256694Snp dereg_mem(&rhp->rdev, stag, mhp->attr.pbl_size, 776256694Snp mhp->attr.pbl_addr); 777256694Snperr2: 778256694Snp c4iw_pblpool_free(&mhp->rhp->rdev, mhp->attr.pbl_addr, 779256694Snp mhp->attr.pbl_size << 3); 780256694Snperr1: 781256694Snp kfree(mhp); 782256694Snperr: 783256694Snp return ERR_PTR(ret); 784256694Snp} 785256694Snp 786256694Snpstruct ib_fast_reg_page_list *c4iw_alloc_fastreg_pbl(struct ib_device *device, 787256694Snp int page_list_len) 788256694Snp{ 789256694Snp struct c4iw_fr_page_list *c4pl; 790256694Snp struct c4iw_dev *dev = to_c4iw_dev(device); 791256694Snp bus_addr_t dma_addr; 792256694Snp int size = sizeof *c4pl + page_list_len * sizeof(u64); 793256694Snp 794256694Snp c4pl = contigmalloc(size, 795256694Snp M_DEVBUF, M_NOWAIT, 0ul, ~0ul, 4096, 0); 796256694Snp if (c4pl) 797256694Snp dma_addr = vtophys(c4pl); 798256694Snp else 799256694Snp return ERR_PTR(-ENOMEM);; 800256694Snp 801256694Snp pci_unmap_addr_set(c4pl, mapping, dma_addr); 802256694Snp c4pl->dma_addr = dma_addr; 803256694Snp c4pl->dev = dev; 804256694Snp c4pl->size = size; 805256694Snp c4pl->ibpl.page_list = (u64 *)(c4pl + 1); 806256694Snp c4pl->ibpl.max_page_list_len = page_list_len; 807256694Snp 808256694Snp return &c4pl->ibpl; 809256694Snp} 810256694Snp 811256694Snpvoid c4iw_free_fastreg_pbl(struct ib_fast_reg_page_list *ibpl) 812256694Snp{ 813256694Snp struct c4iw_fr_page_list *c4pl = to_c4iw_fr_page_list(ibpl); 814256694Snp contigfree(c4pl, c4pl->size, M_DEVBUF); 815256694Snp} 816256694Snp 817256694Snpint c4iw_dereg_mr(struct ib_mr *ib_mr) 818256694Snp{ 819256694Snp struct c4iw_dev *rhp; 820256694Snp struct c4iw_mr *mhp; 821256694Snp u32 mmid; 822256694Snp 823256694Snp CTR2(KTR_IW_CXGBE, "%s ib_mr %p", __func__, ib_mr); 824256694Snp /* There can be no memory windows */ 825256694Snp if (atomic_read(&ib_mr->usecnt)) 826256694Snp return -EINVAL; 827256694Snp 828256694Snp mhp = to_c4iw_mr(ib_mr); 829256694Snp rhp = mhp->rhp; 830256694Snp mmid = mhp->attr.stag >> 8; 831256694Snp remove_handle(rhp, &rhp->mmidr, mmid); 832256694Snp dereg_mem(&rhp->rdev, mhp->attr.stag, mhp->attr.pbl_size, 833256694Snp mhp->attr.pbl_addr); 834256694Snp if (mhp->attr.pbl_size) 835256694Snp c4iw_pblpool_free(&mhp->rhp->rdev, mhp->attr.pbl_addr, 836256694Snp mhp->attr.pbl_size << 3); 837256694Snp if (mhp->kva) 838256694Snp kfree((void *) (unsigned long) mhp->kva); 839256694Snp if (mhp->umem) 840256694Snp ib_umem_release(mhp->umem); 841256694Snp CTR3(KTR_IW_CXGBE, "%s mmid 0x%x ptr %p", __func__, mmid, mhp); 842256694Snp kfree(mhp); 843256694Snp return 0; 844256694Snp} 845256694Snp#endif 846