/* Path: blob/master/drivers/infiniband/hw/ehca/ehca_mrmw.c (15112 views) */
/*1* IBM eServer eHCA Infiniband device driver for Linux on POWER2*3* MR/MW functions4*5* Authors: Dietmar Decker <[email protected]>6* Christoph Raisch <[email protected]>7* Hoang-Nam Nguyen <[email protected]>8*9* Copyright (c) 2005 IBM Corporation10*11* All rights reserved.12*13* This source code is distributed under a dual license of GPL v2.0 and OpenIB14* BSD.15*16* OpenIB BSD License17*18* Redistribution and use in source and binary forms, with or without19* modification, are permitted provided that the following conditions are met:20*21* Redistributions of source code must retain the above copyright notice, this22* list of conditions and the following disclaimer.23*24* Redistributions in binary form must reproduce the above copyright notice,25* this list of conditions and the following disclaimer in the documentation26* and/or other materials27* provided with the distribution.28*29* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"30* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE31* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE32* ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE33* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR34* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF35* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR36* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER37* IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)38* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE39* POSSIBILITY OF SUCH DAMAGE.40*/4142#include <linux/slab.h>43#include <rdma/ib_umem.h>4445#include "ehca_iverbs.h"46#include "ehca_mrmw.h"47#include "hcp_if.h"48#include "hipz_hw.h"4950#define NUM_CHUNKS(length, chunk_size) \51(((length) + (chunk_size - 1)) / (chunk_size))5253/* max number of rpages (per hcall register_rpages) */54#define MAX_RPAGES 5125556/* DMEM toleration management */57#define EHCA_SECTSHIFT SECTION_SIZE_BITS58#define EHCA_SECTSIZE (1UL << EHCA_SECTSHIFT)59#define EHCA_HUGEPAGESHIFT 3460#define EHCA_HUGEPAGE_SIZE (1UL << EHCA_HUGEPAGESHIFT)61#define EHCA_HUGEPAGE_PFN_MASK ((EHCA_HUGEPAGE_SIZE - 1) >> PAGE_SHIFT)62#define EHCA_INVAL_ADDR 0xFFFFFFFFFFFFFFFFULL63#define EHCA_DIR_INDEX_SHIFT 13 /* 8k Entries in 64k block */64#define EHCA_TOP_INDEX_SHIFT (EHCA_DIR_INDEX_SHIFT * 2)65#define EHCA_MAP_ENTRIES (1 << EHCA_DIR_INDEX_SHIFT)66#define EHCA_TOP_MAP_SIZE (0x10000) /* currently fixed map size */67#define EHCA_DIR_MAP_SIZE (0x10000)68#define EHCA_ENT_MAP_SIZE (0x10000)69#define EHCA_INDEX_MASK (EHCA_MAP_ENTRIES - 1)7071static unsigned long ehca_mr_len;7273/*74* Memory map data structures75*/76struct ehca_dir_bmap {77u64 ent[EHCA_MAP_ENTRIES];78};79struct ehca_top_bmap {80struct ehca_dir_bmap *dir[EHCA_MAP_ENTRIES];81};82struct ehca_bmap {83struct ehca_top_bmap *top[EHCA_MAP_ENTRIES];84};8586static struct ehca_bmap *ehca_bmap;8788static struct kmem_cache *mr_cache;89static struct kmem_cache *mw_cache;9091enum ehca_mr_pgsize {92EHCA_MR_PGSIZE4K = 
0x1000L,93EHCA_MR_PGSIZE64K = 0x10000L,94EHCA_MR_PGSIZE1M = 0x100000L,95EHCA_MR_PGSIZE16M = 0x1000000L96};9798#define EHCA_MR_PGSHIFT4K 1299#define EHCA_MR_PGSHIFT64K 16100#define EHCA_MR_PGSHIFT1M 20101#define EHCA_MR_PGSHIFT16M 24102103static u64 ehca_map_vaddr(void *caddr);104105static u32 ehca_encode_hwpage_size(u32 pgsize)106{107int log = ilog2(pgsize);108WARN_ON(log < 12 || log > 24 || log & 3);109return (log - 12) / 4;110}111112static u64 ehca_get_max_hwpage_size(struct ehca_shca *shca)113{114return 1UL << ilog2(shca->hca_cap_mr_pgsize);115}116117static struct ehca_mr *ehca_mr_new(void)118{119struct ehca_mr *me;120121me = kmem_cache_zalloc(mr_cache, GFP_KERNEL);122if (me)123spin_lock_init(&me->mrlock);124else125ehca_gen_err("alloc failed");126127return me;128}129130static void ehca_mr_delete(struct ehca_mr *me)131{132kmem_cache_free(mr_cache, me);133}134135static struct ehca_mw *ehca_mw_new(void)136{137struct ehca_mw *me;138139me = kmem_cache_zalloc(mw_cache, GFP_KERNEL);140if (me)141spin_lock_init(&me->mwlock);142else143ehca_gen_err("alloc failed");144145return me;146}147148static void ehca_mw_delete(struct ehca_mw *me)149{150kmem_cache_free(mw_cache, me);151}152153/*----------------------------------------------------------------------*/154155struct ib_mr *ehca_get_dma_mr(struct ib_pd *pd, int mr_access_flags)156{157struct ib_mr *ib_mr;158int ret;159struct ehca_mr *e_maxmr;160struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);161struct ehca_shca *shca =162container_of(pd->device, struct ehca_shca, ib_device);163164if (shca->maxmr) {165e_maxmr = ehca_mr_new();166if (!e_maxmr) {167ehca_err(&shca->ib_device, "out of memory");168ib_mr = ERR_PTR(-ENOMEM);169goto get_dma_mr_exit0;170}171172ret = ehca_reg_maxmr(shca, e_maxmr,173(void *)ehca_map_vaddr((void *)(KERNELBASE + PHYSICAL_START)),174mr_access_flags, e_pd,175&e_maxmr->ib.ib_mr.lkey,176&e_maxmr->ib.ib_mr.rkey);177if (ret) {178ehca_mr_delete(e_maxmr);179ib_mr = ERR_PTR(ret);180goto 
get_dma_mr_exit0;181}182ib_mr = &e_maxmr->ib.ib_mr;183} else {184ehca_err(&shca->ib_device, "no internal max-MR exist!");185ib_mr = ERR_PTR(-EINVAL);186goto get_dma_mr_exit0;187}188189get_dma_mr_exit0:190if (IS_ERR(ib_mr))191ehca_err(&shca->ib_device, "h_ret=%li pd=%p mr_access_flags=%x",192PTR_ERR(ib_mr), pd, mr_access_flags);193return ib_mr;194} /* end ehca_get_dma_mr() */195196/*----------------------------------------------------------------------*/197198struct ib_mr *ehca_reg_phys_mr(struct ib_pd *pd,199struct ib_phys_buf *phys_buf_array,200int num_phys_buf,201int mr_access_flags,202u64 *iova_start)203{204struct ib_mr *ib_mr;205int ret;206struct ehca_mr *e_mr;207struct ehca_shca *shca =208container_of(pd->device, struct ehca_shca, ib_device);209struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);210211u64 size;212213if ((num_phys_buf <= 0) || !phys_buf_array) {214ehca_err(pd->device, "bad input values: num_phys_buf=%x "215"phys_buf_array=%p", num_phys_buf, phys_buf_array);216ib_mr = ERR_PTR(-EINVAL);217goto reg_phys_mr_exit0;218}219if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&220!(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||221((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&222!(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {223/*224* Remote Write Access requires Local Write Access225* Remote Atomic Access requires Local Write Access226*/227ehca_err(pd->device, "bad input values: mr_access_flags=%x",228mr_access_flags);229ib_mr = ERR_PTR(-EINVAL);230goto reg_phys_mr_exit0;231}232233/* check physical buffer list and calculate size */234ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array, num_phys_buf,235iova_start, &size);236if (ret) {237ib_mr = ERR_PTR(ret);238goto reg_phys_mr_exit0;239}240if ((size == 0) ||241(((u64)iova_start + size) < (u64)iova_start)) {242ehca_err(pd->device, "bad input values: size=%llx iova_start=%p",243size, iova_start);244ib_mr = ERR_PTR(-EINVAL);245goto reg_phys_mr_exit0;246}247248e_mr = ehca_mr_new();249if (!e_mr) 
{250ehca_err(pd->device, "out of memory");251ib_mr = ERR_PTR(-ENOMEM);252goto reg_phys_mr_exit0;253}254255/* register MR on HCA */256if (ehca_mr_is_maxmr(size, iova_start)) {257e_mr->flags |= EHCA_MR_FLAG_MAXMR;258ret = ehca_reg_maxmr(shca, e_mr, iova_start, mr_access_flags,259e_pd, &e_mr->ib.ib_mr.lkey,260&e_mr->ib.ib_mr.rkey);261if (ret) {262ib_mr = ERR_PTR(ret);263goto reg_phys_mr_exit1;264}265} else {266struct ehca_mr_pginfo pginfo;267u32 num_kpages;268u32 num_hwpages;269u64 hw_pgsize;270271num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size,272PAGE_SIZE);273/* for kernel space we try most possible pgsize */274hw_pgsize = ehca_get_max_hwpage_size(shca);275num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size,276hw_pgsize);277memset(&pginfo, 0, sizeof(pginfo));278pginfo.type = EHCA_MR_PGI_PHYS;279pginfo.num_kpages = num_kpages;280pginfo.hwpage_size = hw_pgsize;281pginfo.num_hwpages = num_hwpages;282pginfo.u.phy.num_phys_buf = num_phys_buf;283pginfo.u.phy.phys_buf_array = phys_buf_array;284pginfo.next_hwpage =285((u64)iova_start & ~PAGE_MASK) / hw_pgsize;286287ret = ehca_reg_mr(shca, e_mr, iova_start, size, mr_access_flags,288e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,289&e_mr->ib.ib_mr.rkey, EHCA_REG_MR);290if (ret) {291ib_mr = ERR_PTR(ret);292goto reg_phys_mr_exit1;293}294}295296/* successful registration of all pages */297return &e_mr->ib.ib_mr;298299reg_phys_mr_exit1:300ehca_mr_delete(e_mr);301reg_phys_mr_exit0:302if (IS_ERR(ib_mr))303ehca_err(pd->device, "h_ret=%li pd=%p phys_buf_array=%p "304"num_phys_buf=%x mr_access_flags=%x iova_start=%p",305PTR_ERR(ib_mr), pd, phys_buf_array,306num_phys_buf, mr_access_flags, iova_start);307return ib_mr;308} /* end ehca_reg_phys_mr() */309310/*----------------------------------------------------------------------*/311312struct ib_mr *ehca_reg_user_mr(struct ib_pd *pd, u64 start, u64 length,313u64 virt, int mr_access_flags,314struct ib_udata *udata)315{316struct ib_mr *ib_mr;317struct ehca_mr *e_mr;318struct 
ehca_shca *shca =319container_of(pd->device, struct ehca_shca, ib_device);320struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);321struct ehca_mr_pginfo pginfo;322int ret, page_shift;323u32 num_kpages;324u32 num_hwpages;325u64 hwpage_size;326327if (!pd) {328ehca_gen_err("bad pd=%p", pd);329return ERR_PTR(-EFAULT);330}331332if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&333!(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||334((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&335!(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {336/*337* Remote Write Access requires Local Write Access338* Remote Atomic Access requires Local Write Access339*/340ehca_err(pd->device, "bad input values: mr_access_flags=%x",341mr_access_flags);342ib_mr = ERR_PTR(-EINVAL);343goto reg_user_mr_exit0;344}345346if (length == 0 || virt + length < virt) {347ehca_err(pd->device, "bad input values: length=%llx "348"virt_base=%llx", length, virt);349ib_mr = ERR_PTR(-EINVAL);350goto reg_user_mr_exit0;351}352353e_mr = ehca_mr_new();354if (!e_mr) {355ehca_err(pd->device, "out of memory");356ib_mr = ERR_PTR(-ENOMEM);357goto reg_user_mr_exit0;358}359360e_mr->umem = ib_umem_get(pd->uobject->context, start, length,361mr_access_flags, 0);362if (IS_ERR(e_mr->umem)) {363ib_mr = (void *)e_mr->umem;364goto reg_user_mr_exit1;365}366367if (e_mr->umem->page_size != PAGE_SIZE) {368ehca_err(pd->device, "page size not supported, "369"e_mr->umem->page_size=%x", e_mr->umem->page_size);370ib_mr = ERR_PTR(-EINVAL);371goto reg_user_mr_exit2;372}373374/* determine number of MR pages */375num_kpages = NUM_CHUNKS((virt % PAGE_SIZE) + length, PAGE_SIZE);376/* select proper hw_pgsize */377page_shift = PAGE_SHIFT;378if (e_mr->umem->hugetlb) {379/* determine page_shift, clamp between 4K and 16M */380page_shift = (fls64(length - 1) + 3) & ~3;381page_shift = min(max(page_shift, EHCA_MR_PGSHIFT4K),382EHCA_MR_PGSHIFT16M);383}384hwpage_size = 1UL << page_shift;385386/* now that we have the desired page size, shift until it's387* 
supported, too. 4K is always supported, so this terminates.388*/389while (!(hwpage_size & shca->hca_cap_mr_pgsize))390hwpage_size >>= 4;391392reg_user_mr_fallback:393num_hwpages = NUM_CHUNKS((virt % hwpage_size) + length, hwpage_size);394/* register MR on HCA */395memset(&pginfo, 0, sizeof(pginfo));396pginfo.type = EHCA_MR_PGI_USER;397pginfo.hwpage_size = hwpage_size;398pginfo.num_kpages = num_kpages;399pginfo.num_hwpages = num_hwpages;400pginfo.u.usr.region = e_mr->umem;401pginfo.next_hwpage = e_mr->umem->offset / hwpage_size;402pginfo.u.usr.next_chunk = list_prepare_entry(pginfo.u.usr.next_chunk,403(&e_mr->umem->chunk_list),404list);405406ret = ehca_reg_mr(shca, e_mr, (u64 *)virt, length, mr_access_flags,407e_pd, &pginfo, &e_mr->ib.ib_mr.lkey,408&e_mr->ib.ib_mr.rkey, EHCA_REG_MR);409if (ret == -EINVAL && pginfo.hwpage_size > PAGE_SIZE) {410ehca_warn(pd->device, "failed to register mr "411"with hwpage_size=%llx", hwpage_size);412ehca_info(pd->device, "try to register mr with "413"kpage_size=%lx", PAGE_SIZE);414/*415* this means kpages are not contiguous for a hw page416* try kernel page size as fallback solution417*/418hwpage_size = PAGE_SIZE;419goto reg_user_mr_fallback;420}421if (ret) {422ib_mr = ERR_PTR(ret);423goto reg_user_mr_exit2;424}425426/* successful registration of all pages */427return &e_mr->ib.ib_mr;428429reg_user_mr_exit2:430ib_umem_release(e_mr->umem);431reg_user_mr_exit1:432ehca_mr_delete(e_mr);433reg_user_mr_exit0:434if (IS_ERR(ib_mr))435ehca_err(pd->device, "rc=%li pd=%p mr_access_flags=%x udata=%p",436PTR_ERR(ib_mr), pd, mr_access_flags, udata);437return ib_mr;438} /* end ehca_reg_user_mr() */439440/*----------------------------------------------------------------------*/441442int ehca_rereg_phys_mr(struct ib_mr *mr,443int mr_rereg_mask,444struct ib_pd *pd,445struct ib_phys_buf *phys_buf_array,446int num_phys_buf,447int mr_access_flags,448u64 *iova_start)449{450int ret;451452struct ehca_shca *shca =453container_of(mr->device, struct ehca_shca, 
ib_device);454struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);455u64 new_size;456u64 *new_start;457u32 new_acl;458struct ehca_pd *new_pd;459u32 tmp_lkey, tmp_rkey;460unsigned long sl_flags;461u32 num_kpages = 0;462u32 num_hwpages = 0;463struct ehca_mr_pginfo pginfo;464465if (!(mr_rereg_mask & IB_MR_REREG_TRANS)) {466/* TODO not supported, because PHYP rereg hCall needs pages */467ehca_err(mr->device, "rereg without IB_MR_REREG_TRANS not "468"supported yet, mr_rereg_mask=%x", mr_rereg_mask);469ret = -EINVAL;470goto rereg_phys_mr_exit0;471}472473if (mr_rereg_mask & IB_MR_REREG_PD) {474if (!pd) {475ehca_err(mr->device, "rereg with bad pd, pd=%p "476"mr_rereg_mask=%x", pd, mr_rereg_mask);477ret = -EINVAL;478goto rereg_phys_mr_exit0;479}480}481482if ((mr_rereg_mask &483~(IB_MR_REREG_TRANS | IB_MR_REREG_PD | IB_MR_REREG_ACCESS)) ||484(mr_rereg_mask == 0)) {485ret = -EINVAL;486goto rereg_phys_mr_exit0;487}488489/* check other parameters */490if (e_mr == shca->maxmr) {491/* should be impossible, however reject to be sure */492ehca_err(mr->device, "rereg internal max-MR impossible, mr=%p "493"shca->maxmr=%p mr->lkey=%x",494mr, shca->maxmr, mr->lkey);495ret = -EINVAL;496goto rereg_phys_mr_exit0;497}498if (mr_rereg_mask & IB_MR_REREG_TRANS) { /* transl., i.e. 
addr/size */499if (e_mr->flags & EHCA_MR_FLAG_FMR) {500ehca_err(mr->device, "not supported for FMR, mr=%p "501"flags=%x", mr, e_mr->flags);502ret = -EINVAL;503goto rereg_phys_mr_exit0;504}505if (!phys_buf_array || num_phys_buf <= 0) {506ehca_err(mr->device, "bad input values mr_rereg_mask=%x"507" phys_buf_array=%p num_phys_buf=%x",508mr_rereg_mask, phys_buf_array, num_phys_buf);509ret = -EINVAL;510goto rereg_phys_mr_exit0;511}512}513if ((mr_rereg_mask & IB_MR_REREG_ACCESS) && /* change ACL */514(((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&515!(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||516((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&517!(mr_access_flags & IB_ACCESS_LOCAL_WRITE)))) {518/*519* Remote Write Access requires Local Write Access520* Remote Atomic Access requires Local Write Access521*/522ehca_err(mr->device, "bad input values: mr_rereg_mask=%x "523"mr_access_flags=%x", mr_rereg_mask, mr_access_flags);524ret = -EINVAL;525goto rereg_phys_mr_exit0;526}527528/* set requested values dependent on rereg request */529spin_lock_irqsave(&e_mr->mrlock, sl_flags);530new_start = e_mr->start;531new_size = e_mr->size;532new_acl = e_mr->acl;533new_pd = container_of(mr->pd, struct ehca_pd, ib_pd);534535if (mr_rereg_mask & IB_MR_REREG_TRANS) {536u64 hw_pgsize = ehca_get_max_hwpage_size(shca);537538new_start = iova_start; /* change address */539/* check physical buffer list and calculate size */540ret = ehca_mr_chk_buf_and_calc_size(phys_buf_array,541num_phys_buf, iova_start,542&new_size);543if (ret)544goto rereg_phys_mr_exit1;545if ((new_size == 0) ||546(((u64)iova_start + new_size) < (u64)iova_start)) {547ehca_err(mr->device, "bad input values: new_size=%llx "548"iova_start=%p", new_size, iova_start);549ret = -EINVAL;550goto rereg_phys_mr_exit1;551}552num_kpages = NUM_CHUNKS(((u64)new_start % PAGE_SIZE) +553new_size, PAGE_SIZE);554num_hwpages = NUM_CHUNKS(((u64)new_start % hw_pgsize) +555new_size, hw_pgsize);556memset(&pginfo, 0, sizeof(pginfo));557pginfo.type = 
EHCA_MR_PGI_PHYS;558pginfo.num_kpages = num_kpages;559pginfo.hwpage_size = hw_pgsize;560pginfo.num_hwpages = num_hwpages;561pginfo.u.phy.num_phys_buf = num_phys_buf;562pginfo.u.phy.phys_buf_array = phys_buf_array;563pginfo.next_hwpage =564((u64)iova_start & ~PAGE_MASK) / hw_pgsize;565}566if (mr_rereg_mask & IB_MR_REREG_ACCESS)567new_acl = mr_access_flags;568if (mr_rereg_mask & IB_MR_REREG_PD)569new_pd = container_of(pd, struct ehca_pd, ib_pd);570571ret = ehca_rereg_mr(shca, e_mr, new_start, new_size, new_acl,572new_pd, &pginfo, &tmp_lkey, &tmp_rkey);573if (ret)574goto rereg_phys_mr_exit1;575576/* successful reregistration */577if (mr_rereg_mask & IB_MR_REREG_PD)578mr->pd = pd;579mr->lkey = tmp_lkey;580mr->rkey = tmp_rkey;581582rereg_phys_mr_exit1:583spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);584rereg_phys_mr_exit0:585if (ret)586ehca_err(mr->device, "ret=%i mr=%p mr_rereg_mask=%x pd=%p "587"phys_buf_array=%p num_phys_buf=%x mr_access_flags=%x "588"iova_start=%p",589ret, mr, mr_rereg_mask, pd, phys_buf_array,590num_phys_buf, mr_access_flags, iova_start);591return ret;592} /* end ehca_rereg_phys_mr() */593594/*----------------------------------------------------------------------*/595596int ehca_query_mr(struct ib_mr *mr, struct ib_mr_attr *mr_attr)597{598int ret = 0;599u64 h_ret;600struct ehca_shca *shca =601container_of(mr->device, struct ehca_shca, ib_device);602struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);603unsigned long sl_flags;604struct ehca_mr_hipzout_parms hipzout;605606if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {607ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "608"e_mr->flags=%x", mr, e_mr, e_mr->flags);609ret = -EINVAL;610goto query_mr_exit0;611}612613memset(mr_attr, 0, sizeof(struct ib_mr_attr));614spin_lock_irqsave(&e_mr->mrlock, sl_flags);615616h_ret = hipz_h_query_mr(shca->ipz_hca_handle, e_mr, &hipzout);617if (h_ret != H_SUCCESS) {618ehca_err(mr->device, "hipz_mr_query failed, h_ret=%lli mr=%p "619"hca_hndl=%llx 
mr_hndl=%llx lkey=%x",620h_ret, mr, shca->ipz_hca_handle.handle,621e_mr->ipz_mr_handle.handle, mr->lkey);622ret = ehca2ib_return_code(h_ret);623goto query_mr_exit1;624}625mr_attr->pd = mr->pd;626mr_attr->device_virt_addr = hipzout.vaddr;627mr_attr->size = hipzout.len;628mr_attr->lkey = hipzout.lkey;629mr_attr->rkey = hipzout.rkey;630ehca_mrmw_reverse_map_acl(&hipzout.acl, &mr_attr->mr_access_flags);631632query_mr_exit1:633spin_unlock_irqrestore(&e_mr->mrlock, sl_flags);634query_mr_exit0:635if (ret)636ehca_err(mr->device, "ret=%i mr=%p mr_attr=%p",637ret, mr, mr_attr);638return ret;639} /* end ehca_query_mr() */640641/*----------------------------------------------------------------------*/642643int ehca_dereg_mr(struct ib_mr *mr)644{645int ret = 0;646u64 h_ret;647struct ehca_shca *shca =648container_of(mr->device, struct ehca_shca, ib_device);649struct ehca_mr *e_mr = container_of(mr, struct ehca_mr, ib.ib_mr);650651if ((e_mr->flags & EHCA_MR_FLAG_FMR)) {652ehca_err(mr->device, "not supported for FMR, mr=%p e_mr=%p "653"e_mr->flags=%x", mr, e_mr, e_mr->flags);654ret = -EINVAL;655goto dereg_mr_exit0;656} else if (e_mr == shca->maxmr) {657/* should be impossible, however reject to be sure */658ehca_err(mr->device, "dereg internal max-MR impossible, mr=%p "659"shca->maxmr=%p mr->lkey=%x",660mr, shca->maxmr, mr->lkey);661ret = -EINVAL;662goto dereg_mr_exit0;663}664665/* TODO: BUSY: MR still has bound window(s) */666h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);667if (h_ret != H_SUCCESS) {668ehca_err(mr->device, "hipz_free_mr failed, h_ret=%lli shca=%p "669"e_mr=%p hca_hndl=%llx mr_hndl=%llx mr->lkey=%x",670h_ret, shca, e_mr, shca->ipz_hca_handle.handle,671e_mr->ipz_mr_handle.handle, mr->lkey);672ret = ehca2ib_return_code(h_ret);673goto dereg_mr_exit0;674}675676if (e_mr->umem)677ib_umem_release(e_mr->umem);678679/* successful deregistration */680ehca_mr_delete(e_mr);681682dereg_mr_exit0:683if (ret)684ehca_err(mr->device, "ret=%i mr=%p", ret, mr);685return 
ret;686} /* end ehca_dereg_mr() */687688/*----------------------------------------------------------------------*/689690struct ib_mw *ehca_alloc_mw(struct ib_pd *pd)691{692struct ib_mw *ib_mw;693u64 h_ret;694struct ehca_mw *e_mw;695struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);696struct ehca_shca *shca =697container_of(pd->device, struct ehca_shca, ib_device);698struct ehca_mw_hipzout_parms hipzout;699700e_mw = ehca_mw_new();701if (!e_mw) {702ib_mw = ERR_PTR(-ENOMEM);703goto alloc_mw_exit0;704}705706h_ret = hipz_h_alloc_resource_mw(shca->ipz_hca_handle, e_mw,707e_pd->fw_pd, &hipzout);708if (h_ret != H_SUCCESS) {709ehca_err(pd->device, "hipz_mw_allocate failed, h_ret=%lli "710"shca=%p hca_hndl=%llx mw=%p",711h_ret, shca, shca->ipz_hca_handle.handle, e_mw);712ib_mw = ERR_PTR(ehca2ib_return_code(h_ret));713goto alloc_mw_exit1;714}715/* successful MW allocation */716e_mw->ipz_mw_handle = hipzout.handle;717e_mw->ib_mw.rkey = hipzout.rkey;718return &e_mw->ib_mw;719720alloc_mw_exit1:721ehca_mw_delete(e_mw);722alloc_mw_exit0:723if (IS_ERR(ib_mw))724ehca_err(pd->device, "h_ret=%li pd=%p", PTR_ERR(ib_mw), pd);725return ib_mw;726} /* end ehca_alloc_mw() */727728/*----------------------------------------------------------------------*/729730int ehca_bind_mw(struct ib_qp *qp,731struct ib_mw *mw,732struct ib_mw_bind *mw_bind)733{734/* TODO: not supported up to now */735ehca_gen_err("bind MW currently not supported by HCAD");736737return -EPERM;738} /* end ehca_bind_mw() */739740/*----------------------------------------------------------------------*/741742int ehca_dealloc_mw(struct ib_mw *mw)743{744u64 h_ret;745struct ehca_shca *shca =746container_of(mw->device, struct ehca_shca, ib_device);747struct ehca_mw *e_mw = container_of(mw, struct ehca_mw, ib_mw);748749h_ret = hipz_h_free_resource_mw(shca->ipz_hca_handle, e_mw);750if (h_ret != H_SUCCESS) {751ehca_err(mw->device, "hipz_free_mw failed, h_ret=%lli shca=%p "752"mw=%p rkey=%x hca_hndl=%llx 
mw_hndl=%llx",753h_ret, shca, mw, mw->rkey, shca->ipz_hca_handle.handle,754e_mw->ipz_mw_handle.handle);755return ehca2ib_return_code(h_ret);756}757/* successful deallocation */758ehca_mw_delete(e_mw);759return 0;760} /* end ehca_dealloc_mw() */761762/*----------------------------------------------------------------------*/763764struct ib_fmr *ehca_alloc_fmr(struct ib_pd *pd,765int mr_access_flags,766struct ib_fmr_attr *fmr_attr)767{768struct ib_fmr *ib_fmr;769struct ehca_shca *shca =770container_of(pd->device, struct ehca_shca, ib_device);771struct ehca_pd *e_pd = container_of(pd, struct ehca_pd, ib_pd);772struct ehca_mr *e_fmr;773int ret;774u32 tmp_lkey, tmp_rkey;775struct ehca_mr_pginfo pginfo;776u64 hw_pgsize;777778/* check other parameters */779if (((mr_access_flags & IB_ACCESS_REMOTE_WRITE) &&780!(mr_access_flags & IB_ACCESS_LOCAL_WRITE)) ||781((mr_access_flags & IB_ACCESS_REMOTE_ATOMIC) &&782!(mr_access_flags & IB_ACCESS_LOCAL_WRITE))) {783/*784* Remote Write Access requires Local Write Access785* Remote Atomic Access requires Local Write Access786*/787ehca_err(pd->device, "bad input values: mr_access_flags=%x",788mr_access_flags);789ib_fmr = ERR_PTR(-EINVAL);790goto alloc_fmr_exit0;791}792if (mr_access_flags & IB_ACCESS_MW_BIND) {793ehca_err(pd->device, "bad input values: mr_access_flags=%x",794mr_access_flags);795ib_fmr = ERR_PTR(-EINVAL);796goto alloc_fmr_exit0;797}798if ((fmr_attr->max_pages == 0) || (fmr_attr->max_maps == 0)) {799ehca_err(pd->device, "bad input values: fmr_attr->max_pages=%x "800"fmr_attr->max_maps=%x fmr_attr->page_shift=%x",801fmr_attr->max_pages, fmr_attr->max_maps,802fmr_attr->page_shift);803ib_fmr = ERR_PTR(-EINVAL);804goto alloc_fmr_exit0;805}806807hw_pgsize = 1 << fmr_attr->page_shift;808if (!(hw_pgsize & shca->hca_cap_mr_pgsize)) {809ehca_err(pd->device, "unsupported fmr_attr->page_shift=%x",810fmr_attr->page_shift);811ib_fmr = ERR_PTR(-EINVAL);812goto alloc_fmr_exit0;813}814815e_fmr = ehca_mr_new();816if (!e_fmr) {817ib_fmr = 
ERR_PTR(-ENOMEM);818goto alloc_fmr_exit0;819}820e_fmr->flags |= EHCA_MR_FLAG_FMR;821822/* register MR on HCA */823memset(&pginfo, 0, sizeof(pginfo));824pginfo.hwpage_size = hw_pgsize;825/*826* pginfo.num_hwpages==0, ie register_rpages() will not be called827* but deferred to map_phys_fmr()828*/829ret = ehca_reg_mr(shca, e_fmr, NULL,830fmr_attr->max_pages * (1 << fmr_attr->page_shift),831mr_access_flags, e_pd, &pginfo,832&tmp_lkey, &tmp_rkey, EHCA_REG_MR);833if (ret) {834ib_fmr = ERR_PTR(ret);835goto alloc_fmr_exit1;836}837838/* successful */839e_fmr->hwpage_size = hw_pgsize;840e_fmr->fmr_page_size = 1 << fmr_attr->page_shift;841e_fmr->fmr_max_pages = fmr_attr->max_pages;842e_fmr->fmr_max_maps = fmr_attr->max_maps;843e_fmr->fmr_map_cnt = 0;844return &e_fmr->ib.ib_fmr;845846alloc_fmr_exit1:847ehca_mr_delete(e_fmr);848alloc_fmr_exit0:849return ib_fmr;850} /* end ehca_alloc_fmr() */851852/*----------------------------------------------------------------------*/853854int ehca_map_phys_fmr(struct ib_fmr *fmr,855u64 *page_list,856int list_len,857u64 iova)858{859int ret;860struct ehca_shca *shca =861container_of(fmr->device, struct ehca_shca, ib_device);862struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);863struct ehca_pd *e_pd = container_of(fmr->pd, struct ehca_pd, ib_pd);864struct ehca_mr_pginfo pginfo;865u32 tmp_lkey, tmp_rkey;866867if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {868ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",869e_fmr, e_fmr->flags);870ret = -EINVAL;871goto map_phys_fmr_exit0;872}873ret = ehca_fmr_check_page_list(e_fmr, page_list, list_len);874if (ret)875goto map_phys_fmr_exit0;876if (iova % e_fmr->fmr_page_size) {877/* only whole-numbered pages */878ehca_err(fmr->device, "bad iova, iova=%llx fmr_page_size=%x",879iova, e_fmr->fmr_page_size);880ret = -EINVAL;881goto map_phys_fmr_exit0;882}883if (e_fmr->fmr_map_cnt >= e_fmr->fmr_max_maps) {884/* HCAD does not limit the maps, however trace this anyway 
*/885ehca_info(fmr->device, "map limit exceeded, fmr=%p "886"e_fmr->fmr_map_cnt=%x e_fmr->fmr_max_maps=%x",887fmr, e_fmr->fmr_map_cnt, e_fmr->fmr_max_maps);888}889890memset(&pginfo, 0, sizeof(pginfo));891pginfo.type = EHCA_MR_PGI_FMR;892pginfo.num_kpages = list_len;893pginfo.hwpage_size = e_fmr->hwpage_size;894pginfo.num_hwpages =895list_len * e_fmr->fmr_page_size / pginfo.hwpage_size;896pginfo.u.fmr.page_list = page_list;897pginfo.next_hwpage =898(iova & (e_fmr->fmr_page_size-1)) / pginfo.hwpage_size;899pginfo.u.fmr.fmr_pgsize = e_fmr->fmr_page_size;900901ret = ehca_rereg_mr(shca, e_fmr, (u64 *)iova,902list_len * e_fmr->fmr_page_size,903e_fmr->acl, e_pd, &pginfo, &tmp_lkey, &tmp_rkey);904if (ret)905goto map_phys_fmr_exit0;906907/* successful reregistration */908e_fmr->fmr_map_cnt++;909e_fmr->ib.ib_fmr.lkey = tmp_lkey;910e_fmr->ib.ib_fmr.rkey = tmp_rkey;911return 0;912913map_phys_fmr_exit0:914if (ret)915ehca_err(fmr->device, "ret=%i fmr=%p page_list=%p list_len=%x "916"iova=%llx", ret, fmr, page_list, list_len, iova);917return ret;918} /* end ehca_map_phys_fmr() */919920/*----------------------------------------------------------------------*/921922int ehca_unmap_fmr(struct list_head *fmr_list)923{924int ret = 0;925struct ib_fmr *ib_fmr;926struct ehca_shca *shca = NULL;927struct ehca_shca *prev_shca;928struct ehca_mr *e_fmr;929u32 num_fmr = 0;930u32 unmap_fmr_cnt = 0;931932/* check all FMR belong to same SHCA, and check internal flag */933list_for_each_entry(ib_fmr, fmr_list, list) {934prev_shca = shca;935shca = container_of(ib_fmr->device, struct ehca_shca,936ib_device);937e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);938if ((shca != prev_shca) && prev_shca) {939ehca_err(&shca->ib_device, "SHCA mismatch, shca=%p "940"prev_shca=%p e_fmr=%p",941shca, prev_shca, e_fmr);942ret = -EINVAL;943goto unmap_fmr_exit0;944}945if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {946ehca_err(&shca->ib_device, "not a FMR, e_fmr=%p "947"e_fmr->flags=%x", e_fmr, e_fmr->flags);948ret 
= -EINVAL;949goto unmap_fmr_exit0;950}951num_fmr++;952}953954/* loop over all FMRs to unmap */955list_for_each_entry(ib_fmr, fmr_list, list) {956unmap_fmr_cnt++;957e_fmr = container_of(ib_fmr, struct ehca_mr, ib.ib_fmr);958shca = container_of(ib_fmr->device, struct ehca_shca,959ib_device);960ret = ehca_unmap_one_fmr(shca, e_fmr);961if (ret) {962/* unmap failed, stop unmapping of rest of FMRs */963ehca_err(&shca->ib_device, "unmap of one FMR failed, "964"stop rest, e_fmr=%p num_fmr=%x "965"unmap_fmr_cnt=%x lkey=%x", e_fmr, num_fmr,966unmap_fmr_cnt, e_fmr->ib.ib_fmr.lkey);967goto unmap_fmr_exit0;968}969}970971unmap_fmr_exit0:972if (ret)973ehca_gen_err("ret=%i fmr_list=%p num_fmr=%x unmap_fmr_cnt=%x",974ret, fmr_list, num_fmr, unmap_fmr_cnt);975return ret;976} /* end ehca_unmap_fmr() */977978/*----------------------------------------------------------------------*/979980int ehca_dealloc_fmr(struct ib_fmr *fmr)981{982int ret;983u64 h_ret;984struct ehca_shca *shca =985container_of(fmr->device, struct ehca_shca, ib_device);986struct ehca_mr *e_fmr = container_of(fmr, struct ehca_mr, ib.ib_fmr);987988if (!(e_fmr->flags & EHCA_MR_FLAG_FMR)) {989ehca_err(fmr->device, "not a FMR, e_fmr=%p e_fmr->flags=%x",990e_fmr, e_fmr->flags);991ret = -EINVAL;992goto free_fmr_exit0;993}994995h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);996if (h_ret != H_SUCCESS) {997ehca_err(fmr->device, "hipz_free_mr failed, h_ret=%lli e_fmr=%p "998"hca_hndl=%llx fmr_hndl=%llx fmr->lkey=%x",999h_ret, e_fmr, shca->ipz_hca_handle.handle,1000e_fmr->ipz_mr_handle.handle, fmr->lkey);1001ret = ehca2ib_return_code(h_ret);1002goto free_fmr_exit0;1003}1004/* successful deregistration */1005ehca_mr_delete(e_fmr);1006return 0;10071008free_fmr_exit0:1009if (ret)1010ehca_err(&shca->ib_device, "ret=%i fmr=%p", ret, fmr);1011return ret;1012} /* end ehca_dealloc_fmr() */10131014/*----------------------------------------------------------------------*/10151016static int ehca_reg_bmap_mr_rpages(struct 
ehca_shca *shca,1017struct ehca_mr *e_mr,1018struct ehca_mr_pginfo *pginfo);10191020int ehca_reg_mr(struct ehca_shca *shca,1021struct ehca_mr *e_mr,1022u64 *iova_start,1023u64 size,1024int acl,1025struct ehca_pd *e_pd,1026struct ehca_mr_pginfo *pginfo,1027u32 *lkey, /*OUT*/1028u32 *rkey, /*OUT*/1029enum ehca_reg_type reg_type)1030{1031int ret;1032u64 h_ret;1033u32 hipz_acl;1034struct ehca_mr_hipzout_parms hipzout;10351036ehca_mrmw_map_acl(acl, &hipz_acl);1037ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);1038if (ehca_use_hp_mr == 1)1039hipz_acl |= 0x00000001;10401041h_ret = hipz_h_alloc_resource_mr(shca->ipz_hca_handle, e_mr,1042(u64)iova_start, size, hipz_acl,1043e_pd->fw_pd, &hipzout);1044if (h_ret != H_SUCCESS) {1045ehca_err(&shca->ib_device, "hipz_alloc_mr failed, h_ret=%lli "1046"hca_hndl=%llx", h_ret, shca->ipz_hca_handle.handle);1047ret = ehca2ib_return_code(h_ret);1048goto ehca_reg_mr_exit0;1049}10501051e_mr->ipz_mr_handle = hipzout.handle;10521053if (reg_type == EHCA_REG_BUSMAP_MR)1054ret = ehca_reg_bmap_mr_rpages(shca, e_mr, pginfo);1055else if (reg_type == EHCA_REG_MR)1056ret = ehca_reg_mr_rpages(shca, e_mr, pginfo);1057else1058ret = -EINVAL;10591060if (ret)1061goto ehca_reg_mr_exit1;10621063/* successful registration */1064e_mr->num_kpages = pginfo->num_kpages;1065e_mr->num_hwpages = pginfo->num_hwpages;1066e_mr->hwpage_size = pginfo->hwpage_size;1067e_mr->start = iova_start;1068e_mr->size = size;1069e_mr->acl = acl;1070*lkey = hipzout.lkey;1071*rkey = hipzout.rkey;1072return 0;10731074ehca_reg_mr_exit1:1075h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);1076if (h_ret != H_SUCCESS) {1077ehca_err(&shca->ib_device, "h_ret=%lli shca=%p e_mr=%p "1078"iova_start=%p size=%llx acl=%x e_pd=%p lkey=%x "1079"pginfo=%p num_kpages=%llx num_hwpages=%llx ret=%i",1080h_ret, shca, e_mr, iova_start, size, acl, e_pd,1081hipzout.lkey, pginfo, pginfo->num_kpages,1082pginfo->num_hwpages, ret);1083ehca_err(&shca->ib_device, "internal error in 
ehca_reg_mr, "1084"not recoverable");1085}1086ehca_reg_mr_exit0:1087if (ret)1088ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "1089"iova_start=%p size=%llx acl=%x e_pd=%p pginfo=%p "1090"num_kpages=%llx num_hwpages=%llx",1091ret, shca, e_mr, iova_start, size, acl, e_pd, pginfo,1092pginfo->num_kpages, pginfo->num_hwpages);1093return ret;1094} /* end ehca_reg_mr() */10951096/*----------------------------------------------------------------------*/10971098int ehca_reg_mr_rpages(struct ehca_shca *shca,1099struct ehca_mr *e_mr,1100struct ehca_mr_pginfo *pginfo)1101{1102int ret = 0;1103u64 h_ret;1104u32 rnum;1105u64 rpage;1106u32 i;1107u64 *kpage;11081109if (!pginfo->num_hwpages) /* in case of fmr */1110return 0;11111112kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);1113if (!kpage) {1114ehca_err(&shca->ib_device, "kpage alloc failed");1115ret = -ENOMEM;1116goto ehca_reg_mr_rpages_exit0;1117}11181119/* max MAX_RPAGES ehca mr pages per register call */1120for (i = 0; i < NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES); i++) {11211122if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {1123rnum = pginfo->num_hwpages % MAX_RPAGES; /* last shot */1124if (rnum == 0)1125rnum = MAX_RPAGES; /* last shot is full */1126} else1127rnum = MAX_RPAGES;11281129ret = ehca_set_pagebuf(pginfo, rnum, kpage);1130if (ret) {1131ehca_err(&shca->ib_device, "ehca_set_pagebuf "1132"bad rc, ret=%i rnum=%x kpage=%p",1133ret, rnum, kpage);1134goto ehca_reg_mr_rpages_exit1;1135}11361137if (rnum > 1) {1138rpage = virt_to_abs(kpage);1139if (!rpage) {1140ehca_err(&shca->ib_device, "kpage=%p i=%x",1141kpage, i);1142ret = -EFAULT;1143goto ehca_reg_mr_rpages_exit1;1144}1145} else1146rpage = *kpage;11471148h_ret = hipz_h_register_rpage_mr(1149shca->ipz_hca_handle, e_mr,1150ehca_encode_hwpage_size(pginfo->hwpage_size),11510, rpage, rnum);11521153if (i == NUM_CHUNKS(pginfo->num_hwpages, MAX_RPAGES) - 1) {1154/*1155* check for 'registration complete'==H_SUCCESS1156* and for 'page 
registered'==H_PAGE_REGISTERED1157*/1158if (h_ret != H_SUCCESS) {1159ehca_err(&shca->ib_device, "last "1160"hipz_reg_rpage_mr failed, h_ret=%lli "1161"e_mr=%p i=%x hca_hndl=%llx mr_hndl=%llx"1162" lkey=%x", h_ret, e_mr, i,1163shca->ipz_hca_handle.handle,1164e_mr->ipz_mr_handle.handle,1165e_mr->ib.ib_mr.lkey);1166ret = ehca2ib_return_code(h_ret);1167break;1168} else1169ret = 0;1170} else if (h_ret != H_PAGE_REGISTERED) {1171ehca_err(&shca->ib_device, "hipz_reg_rpage_mr failed, "1172"h_ret=%lli e_mr=%p i=%x lkey=%x hca_hndl=%llx "1173"mr_hndl=%llx", h_ret, e_mr, i,1174e_mr->ib.ib_mr.lkey,1175shca->ipz_hca_handle.handle,1176e_mr->ipz_mr_handle.handle);1177ret = ehca2ib_return_code(h_ret);1178break;1179} else1180ret = 0;1181} /* end for(i) */118211831184ehca_reg_mr_rpages_exit1:1185ehca_free_fw_ctrlblock(kpage);1186ehca_reg_mr_rpages_exit0:1187if (ret)1188ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p pginfo=%p "1189"num_kpages=%llx num_hwpages=%llx", ret, shca, e_mr,1190pginfo, pginfo->num_kpages, pginfo->num_hwpages);1191return ret;1192} /* end ehca_reg_mr_rpages() */11931194/*----------------------------------------------------------------------*/11951196inline int ehca_rereg_mr_rereg1(struct ehca_shca *shca,1197struct ehca_mr *e_mr,1198u64 *iova_start,1199u64 size,1200u32 acl,1201struct ehca_pd *e_pd,1202struct ehca_mr_pginfo *pginfo,1203u32 *lkey, /*OUT*/1204u32 *rkey) /*OUT*/1205{1206int ret;1207u64 h_ret;1208u32 hipz_acl;1209u64 *kpage;1210u64 rpage;1211struct ehca_mr_pginfo pginfo_save;1212struct ehca_mr_hipzout_parms hipzout;12131214ehca_mrmw_map_acl(acl, &hipz_acl);1215ehca_mrmw_set_pgsize_hipz_acl(pginfo->hwpage_size, &hipz_acl);12161217kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);1218if (!kpage) {1219ehca_err(&shca->ib_device, "kpage alloc failed");1220ret = -ENOMEM;1221goto ehca_rereg_mr_rereg1_exit0;1222}12231224pginfo_save = *pginfo;1225ret = ehca_set_pagebuf(pginfo, pginfo->num_hwpages, kpage);1226if (ret) {1227ehca_err(&shca->ib_device, "set pagebuf 
failed, e_mr=%p "1228"pginfo=%p type=%x num_kpages=%llx num_hwpages=%llx "1229"kpage=%p", e_mr, pginfo, pginfo->type,1230pginfo->num_kpages, pginfo->num_hwpages, kpage);1231goto ehca_rereg_mr_rereg1_exit1;1232}1233rpage = virt_to_abs(kpage);1234if (!rpage) {1235ehca_err(&shca->ib_device, "kpage=%p", kpage);1236ret = -EFAULT;1237goto ehca_rereg_mr_rereg1_exit1;1238}1239h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_mr,1240(u64)iova_start, size, hipz_acl,1241e_pd->fw_pd, rpage, &hipzout);1242if (h_ret != H_SUCCESS) {1243/*1244* reregistration unsuccessful, try it again with the 3 hCalls,1245* e.g. this is required in case H_MR_CONDITION1246* (MW bound or MR is shared)1247*/1248ehca_warn(&shca->ib_device, "hipz_h_reregister_pmr failed "1249"(Rereg1), h_ret=%lli e_mr=%p", h_ret, e_mr);1250*pginfo = pginfo_save;1251ret = -EAGAIN;1252} else if ((u64 *)hipzout.vaddr != iova_start) {1253ehca_err(&shca->ib_device, "PHYP changed iova_start in "1254"rereg_pmr, iova_start=%p iova_start_out=%llx e_mr=%p "1255"mr_handle=%llx lkey=%x lkey_out=%x", iova_start,1256hipzout.vaddr, e_mr, e_mr->ipz_mr_handle.handle,1257e_mr->ib.ib_mr.lkey, hipzout.lkey);1258ret = -EFAULT;1259} else {1260/*1261* successful reregistration1262* note: start and start_out are identical for eServer HCAs1263*/1264e_mr->num_kpages = pginfo->num_kpages;1265e_mr->num_hwpages = pginfo->num_hwpages;1266e_mr->hwpage_size = pginfo->hwpage_size;1267e_mr->start = iova_start;1268e_mr->size = size;1269e_mr->acl = acl;1270*lkey = hipzout.lkey;1271*rkey = hipzout.rkey;1272}12731274ehca_rereg_mr_rereg1_exit1:1275ehca_free_fw_ctrlblock(kpage);1276ehca_rereg_mr_rereg1_exit0:1277if ( ret && (ret != -EAGAIN) )1278ehca_err(&shca->ib_device, "ret=%i lkey=%x rkey=%x "1279"pginfo=%p num_kpages=%llx num_hwpages=%llx",1280ret, *lkey, *rkey, pginfo, pginfo->num_kpages,1281pginfo->num_hwpages);1282return ret;1283} /* end ehca_rereg_mr_rereg1() 
*/12841285/*----------------------------------------------------------------------*/12861287int ehca_rereg_mr(struct ehca_shca *shca,1288struct ehca_mr *e_mr,1289u64 *iova_start,1290u64 size,1291int acl,1292struct ehca_pd *e_pd,1293struct ehca_mr_pginfo *pginfo,1294u32 *lkey,1295u32 *rkey)1296{1297int ret = 0;1298u64 h_ret;1299int rereg_1_hcall = 1; /* 1: use hipz_h_reregister_pmr directly */1300int rereg_3_hcall = 0; /* 1: use 3 hipz calls for reregistration */13011302/* first determine reregistration hCall(s) */1303if ((pginfo->num_hwpages > MAX_RPAGES) ||1304(e_mr->num_hwpages > MAX_RPAGES) ||1305(pginfo->num_hwpages > e_mr->num_hwpages)) {1306ehca_dbg(&shca->ib_device, "Rereg3 case, "1307"pginfo->num_hwpages=%llx e_mr->num_hwpages=%x",1308pginfo->num_hwpages, e_mr->num_hwpages);1309rereg_1_hcall = 0;1310rereg_3_hcall = 1;1311}13121313if (e_mr->flags & EHCA_MR_FLAG_MAXMR) { /* check for max-MR */1314rereg_1_hcall = 0;1315rereg_3_hcall = 1;1316e_mr->flags &= ~EHCA_MR_FLAG_MAXMR;1317ehca_err(&shca->ib_device, "Rereg MR for max-MR! 
e_mr=%p",1318e_mr);1319}13201321if (rereg_1_hcall) {1322ret = ehca_rereg_mr_rereg1(shca, e_mr, iova_start, size,1323acl, e_pd, pginfo, lkey, rkey);1324if (ret) {1325if (ret == -EAGAIN)1326rereg_3_hcall = 1;1327else1328goto ehca_rereg_mr_exit0;1329}1330}13311332if (rereg_3_hcall) {1333struct ehca_mr save_mr;13341335/* first deregister old MR */1336h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_mr);1337if (h_ret != H_SUCCESS) {1338ehca_err(&shca->ib_device, "hipz_free_mr failed, "1339"h_ret=%lli e_mr=%p hca_hndl=%llx mr_hndl=%llx "1340"mr->lkey=%x",1341h_ret, e_mr, shca->ipz_hca_handle.handle,1342e_mr->ipz_mr_handle.handle,1343e_mr->ib.ib_mr.lkey);1344ret = ehca2ib_return_code(h_ret);1345goto ehca_rereg_mr_exit0;1346}1347/* clean ehca_mr_t, without changing struct ib_mr and lock */1348save_mr = *e_mr;1349ehca_mr_deletenew(e_mr);13501351/* set some MR values */1352e_mr->flags = save_mr.flags;1353e_mr->hwpage_size = save_mr.hwpage_size;1354e_mr->fmr_page_size = save_mr.fmr_page_size;1355e_mr->fmr_max_pages = save_mr.fmr_max_pages;1356e_mr->fmr_max_maps = save_mr.fmr_max_maps;1357e_mr->fmr_map_cnt = save_mr.fmr_map_cnt;13581359ret = ehca_reg_mr(shca, e_mr, iova_start, size, acl,1360e_pd, pginfo, lkey, rkey, EHCA_REG_MR);1361if (ret) {1362u32 offset = (u64)(&e_mr->flags) - (u64)e_mr;1363memcpy(&e_mr->flags, &(save_mr.flags),1364sizeof(struct ehca_mr) - offset);1365goto ehca_rereg_mr_exit0;1366}1367}13681369ehca_rereg_mr_exit0:1370if (ret)1371ehca_err(&shca->ib_device, "ret=%i shca=%p e_mr=%p "1372"iova_start=%p size=%llx acl=%x e_pd=%p pginfo=%p "1373"num_kpages=%llx lkey=%x rkey=%x rereg_1_hcall=%x "1374"rereg_3_hcall=%x", ret, shca, e_mr, iova_start, size,1375acl, e_pd, pginfo, pginfo->num_kpages, *lkey, *rkey,1376rereg_1_hcall, rereg_3_hcall);1377return ret;1378} /* end ehca_rereg_mr() */13791380/*----------------------------------------------------------------------*/13811382int ehca_unmap_one_fmr(struct ehca_shca *shca,1383struct ehca_mr *e_fmr)1384{1385int 
ret = 0;1386u64 h_ret;1387struct ehca_pd *e_pd =1388container_of(e_fmr->ib.ib_fmr.pd, struct ehca_pd, ib_pd);1389struct ehca_mr save_fmr;1390u32 tmp_lkey, tmp_rkey;1391struct ehca_mr_pginfo pginfo;1392struct ehca_mr_hipzout_parms hipzout;1393struct ehca_mr save_mr;13941395if (e_fmr->fmr_max_pages <= MAX_RPAGES) {1396/*1397* note: after using rereg hcall with len=0,1398* rereg hcall must be used again for registering pages1399*/1400h_ret = hipz_h_reregister_pmr(shca->ipz_hca_handle, e_fmr, 0,14010, 0, e_pd->fw_pd, 0, &hipzout);1402if (h_ret == H_SUCCESS) {1403/* successful reregistration */1404e_fmr->start = NULL;1405e_fmr->size = 0;1406tmp_lkey = hipzout.lkey;1407tmp_rkey = hipzout.rkey;1408return 0;1409}1410/*1411* should not happen, because length checked above,1412* FMRs are not shared and no MW bound to FMRs1413*/1414ehca_err(&shca->ib_device, "hipz_reregister_pmr failed "1415"(Rereg1), h_ret=%lli e_fmr=%p hca_hndl=%llx "1416"mr_hndl=%llx lkey=%x lkey_out=%x",1417h_ret, e_fmr, shca->ipz_hca_handle.handle,1418e_fmr->ipz_mr_handle.handle,1419e_fmr->ib.ib_fmr.lkey, hipzout.lkey);1420/* try free and rereg */1421}14221423/* first free old FMR */1424h_ret = hipz_h_free_resource_mr(shca->ipz_hca_handle, e_fmr);1425if (h_ret != H_SUCCESS) {1426ehca_err(&shca->ib_device, "hipz_free_mr failed, "1427"h_ret=%lli e_fmr=%p hca_hndl=%llx mr_hndl=%llx "1428"lkey=%x",1429h_ret, e_fmr, shca->ipz_hca_handle.handle,1430e_fmr->ipz_mr_handle.handle,1431e_fmr->ib.ib_fmr.lkey);1432ret = ehca2ib_return_code(h_ret);1433goto ehca_unmap_one_fmr_exit0;1434}1435/* clean ehca_mr_t, without changing lock */1436save_fmr = *e_fmr;1437ehca_mr_deletenew(e_fmr);14381439/* set some MR values */1440e_fmr->flags = save_fmr.flags;1441e_fmr->hwpage_size = save_fmr.hwpage_size;1442e_fmr->fmr_page_size = save_fmr.fmr_page_size;1443e_fmr->fmr_max_pages = save_fmr.fmr_max_pages;1444e_fmr->fmr_max_maps = save_fmr.fmr_max_maps;1445e_fmr->fmr_map_cnt = save_fmr.fmr_map_cnt;1446e_fmr->acl = 
save_fmr.acl;14471448memset(&pginfo, 0, sizeof(pginfo));1449pginfo.type = EHCA_MR_PGI_FMR;1450ret = ehca_reg_mr(shca, e_fmr, NULL,1451(e_fmr->fmr_max_pages * e_fmr->fmr_page_size),1452e_fmr->acl, e_pd, &pginfo, &tmp_lkey,1453&tmp_rkey, EHCA_REG_MR);1454if (ret) {1455u32 offset = (u64)(&e_fmr->flags) - (u64)e_fmr;1456memcpy(&e_fmr->flags, &(save_mr.flags),1457sizeof(struct ehca_mr) - offset);1458}14591460ehca_unmap_one_fmr_exit0:1461if (ret)1462ehca_err(&shca->ib_device, "ret=%i tmp_lkey=%x tmp_rkey=%x "1463"fmr_max_pages=%x",1464ret, tmp_lkey, tmp_rkey, e_fmr->fmr_max_pages);1465return ret;1466} /* end ehca_unmap_one_fmr() */14671468/*----------------------------------------------------------------------*/14691470int ehca_reg_smr(struct ehca_shca *shca,1471struct ehca_mr *e_origmr,1472struct ehca_mr *e_newmr,1473u64 *iova_start,1474int acl,1475struct ehca_pd *e_pd,1476u32 *lkey, /*OUT*/1477u32 *rkey) /*OUT*/1478{1479int ret = 0;1480u64 h_ret;1481u32 hipz_acl;1482struct ehca_mr_hipzout_parms hipzout;14831484ehca_mrmw_map_acl(acl, &hipz_acl);1485ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);14861487h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,1488(u64)iova_start, hipz_acl, e_pd->fw_pd,1489&hipzout);1490if (h_ret != H_SUCCESS) {1491ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lli "1492"shca=%p e_origmr=%p e_newmr=%p iova_start=%p acl=%x "1493"e_pd=%p hca_hndl=%llx mr_hndl=%llx lkey=%x",1494h_ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd,1495shca->ipz_hca_handle.handle,1496e_origmr->ipz_mr_handle.handle,1497e_origmr->ib.ib_mr.lkey);1498ret = ehca2ib_return_code(h_ret);1499goto ehca_reg_smr_exit0;1500}1501/* successful registration */1502e_newmr->num_kpages = e_origmr->num_kpages;1503e_newmr->num_hwpages = e_origmr->num_hwpages;1504e_newmr->hwpage_size = e_origmr->hwpage_size;1505e_newmr->start = iova_start;1506e_newmr->size = e_origmr->size;1507e_newmr->acl = acl;1508e_newmr->ipz_mr_handle = 
hipzout.handle;1509*lkey = hipzout.lkey;1510*rkey = hipzout.rkey;1511return 0;15121513ehca_reg_smr_exit0:1514if (ret)1515ehca_err(&shca->ib_device, "ret=%i shca=%p e_origmr=%p "1516"e_newmr=%p iova_start=%p acl=%x e_pd=%p",1517ret, shca, e_origmr, e_newmr, iova_start, acl, e_pd);1518return ret;1519} /* end ehca_reg_smr() */15201521/*----------------------------------------------------------------------*/1522static inline void *ehca_calc_sectbase(int top, int dir, int idx)1523{1524unsigned long ret = idx;1525ret |= dir << EHCA_DIR_INDEX_SHIFT;1526ret |= top << EHCA_TOP_INDEX_SHIFT;1527return abs_to_virt(ret << SECTION_SIZE_BITS);1528}15291530#define ehca_bmap_valid(entry) \1531((u64)entry != (u64)EHCA_INVAL_ADDR)15321533static u64 ehca_reg_mr_section(int top, int dir, int idx, u64 *kpage,1534struct ehca_shca *shca, struct ehca_mr *mr,1535struct ehca_mr_pginfo *pginfo)1536{1537u64 h_ret = 0;1538unsigned long page = 0;1539u64 rpage = virt_to_abs(kpage);1540int page_count;15411542void *sectbase = ehca_calc_sectbase(top, dir, idx);1543if ((unsigned long)sectbase & (pginfo->hwpage_size - 1)) {1544ehca_err(&shca->ib_device, "reg_mr_section will probably fail:"1545"hwpage_size does not fit to "1546"section start address");1547}1548page_count = EHCA_SECTSIZE / pginfo->hwpage_size;15491550while (page < page_count) {1551u64 rnum;1552for (rnum = 0; (rnum < MAX_RPAGES) && (page < page_count);1553rnum++) {1554void *pg = sectbase + ((page++) * pginfo->hwpage_size);1555kpage[rnum] = virt_to_abs(pg);1556}15571558h_ret = hipz_h_register_rpage_mr(shca->ipz_hca_handle, mr,1559ehca_encode_hwpage_size(pginfo->hwpage_size),15600, rpage, rnum);15611562if ((h_ret != H_SUCCESS) && (h_ret != H_PAGE_REGISTERED)) {1563ehca_err(&shca->ib_device, "register_rpage_mr failed");1564return h_ret;1565}1566}1567return h_ret;1568}15691570static u64 ehca_reg_mr_sections(int top, int dir, u64 *kpage,1571struct ehca_shca *shca, struct ehca_mr *mr,1572struct ehca_mr_pginfo *pginfo)1573{1574u64 hret = 
H_SUCCESS;1575int idx;15761577for (idx = 0; idx < EHCA_MAP_ENTRIES; idx++) {1578if (!ehca_bmap_valid(ehca_bmap->top[top]->dir[dir]->ent[idx]))1579continue;15801581hret = ehca_reg_mr_section(top, dir, idx, kpage, shca, mr,1582pginfo);1583if ((hret != H_SUCCESS) && (hret != H_PAGE_REGISTERED))1584return hret;1585}1586return hret;1587}15881589static u64 ehca_reg_mr_dir_sections(int top, u64 *kpage, struct ehca_shca *shca,1590struct ehca_mr *mr,1591struct ehca_mr_pginfo *pginfo)1592{1593u64 hret = H_SUCCESS;1594int dir;15951596for (dir = 0; dir < EHCA_MAP_ENTRIES; dir++) {1597if (!ehca_bmap_valid(ehca_bmap->top[top]->dir[dir]))1598continue;15991600hret = ehca_reg_mr_sections(top, dir, kpage, shca, mr, pginfo);1601if ((hret != H_SUCCESS) && (hret != H_PAGE_REGISTERED))1602return hret;1603}1604return hret;1605}16061607/* register internal max-MR to internal SHCA */1608int ehca_reg_internal_maxmr(1609struct ehca_shca *shca,1610struct ehca_pd *e_pd,1611struct ehca_mr **e_maxmr) /*OUT*/1612{1613int ret;1614struct ehca_mr *e_mr;1615u64 *iova_start;1616u64 size_maxmr;1617struct ehca_mr_pginfo pginfo;1618struct ib_phys_buf ib_pbuf;1619u32 num_kpages;1620u32 num_hwpages;1621u64 hw_pgsize;16221623if (!ehca_bmap) {1624ret = -EFAULT;1625goto ehca_reg_internal_maxmr_exit0;1626}16271628e_mr = ehca_mr_new();1629if (!e_mr) {1630ehca_err(&shca->ib_device, "out of memory");1631ret = -ENOMEM;1632goto ehca_reg_internal_maxmr_exit0;1633}1634e_mr->flags |= EHCA_MR_FLAG_MAXMR;16351636/* register internal max-MR on HCA */1637size_maxmr = ehca_mr_len;1638iova_start = (u64 *)ehca_map_vaddr((void *)(KERNELBASE + PHYSICAL_START));1639ib_pbuf.addr = 0;1640ib_pbuf.size = size_maxmr;1641num_kpages = NUM_CHUNKS(((u64)iova_start % PAGE_SIZE) + size_maxmr,1642PAGE_SIZE);1643hw_pgsize = ehca_get_max_hwpage_size(shca);1644num_hwpages = NUM_CHUNKS(((u64)iova_start % hw_pgsize) + size_maxmr,1645hw_pgsize);16461647memset(&pginfo, 0, sizeof(pginfo));1648pginfo.type = EHCA_MR_PGI_PHYS;1649pginfo.num_kpages = 
num_kpages;1650pginfo.num_hwpages = num_hwpages;1651pginfo.hwpage_size = hw_pgsize;1652pginfo.u.phy.num_phys_buf = 1;1653pginfo.u.phy.phys_buf_array = &ib_pbuf;16541655ret = ehca_reg_mr(shca, e_mr, iova_start, size_maxmr, 0, e_pd,1656&pginfo, &e_mr->ib.ib_mr.lkey,1657&e_mr->ib.ib_mr.rkey, EHCA_REG_BUSMAP_MR);1658if (ret) {1659ehca_err(&shca->ib_device, "reg of internal max MR failed, "1660"e_mr=%p iova_start=%p size_maxmr=%llx num_kpages=%x "1661"num_hwpages=%x", e_mr, iova_start, size_maxmr,1662num_kpages, num_hwpages);1663goto ehca_reg_internal_maxmr_exit1;1664}16651666/* successful registration of all pages */1667e_mr->ib.ib_mr.device = e_pd->ib_pd.device;1668e_mr->ib.ib_mr.pd = &e_pd->ib_pd;1669e_mr->ib.ib_mr.uobject = NULL;1670atomic_inc(&(e_pd->ib_pd.usecnt));1671atomic_set(&(e_mr->ib.ib_mr.usecnt), 0);1672*e_maxmr = e_mr;1673return 0;16741675ehca_reg_internal_maxmr_exit1:1676ehca_mr_delete(e_mr);1677ehca_reg_internal_maxmr_exit0:1678if (ret)1679ehca_err(&shca->ib_device, "ret=%i shca=%p e_pd=%p e_maxmr=%p",1680ret, shca, e_pd, e_maxmr);1681return ret;1682} /* end ehca_reg_internal_maxmr() */16831684/*----------------------------------------------------------------------*/16851686int ehca_reg_maxmr(struct ehca_shca *shca,1687struct ehca_mr *e_newmr,1688u64 *iova_start,1689int acl,1690struct ehca_pd *e_pd,1691u32 *lkey,1692u32 *rkey)1693{1694u64 h_ret;1695struct ehca_mr *e_origmr = shca->maxmr;1696u32 hipz_acl;1697struct ehca_mr_hipzout_parms hipzout;16981699ehca_mrmw_map_acl(acl, &hipz_acl);1700ehca_mrmw_set_pgsize_hipz_acl(e_origmr->hwpage_size, &hipz_acl);17011702h_ret = hipz_h_register_smr(shca->ipz_hca_handle, e_newmr, e_origmr,1703(u64)iova_start, hipz_acl, e_pd->fw_pd,1704&hipzout);1705if (h_ret != H_SUCCESS) {1706ehca_err(&shca->ib_device, "hipz_reg_smr failed, h_ret=%lli "1707"e_origmr=%p hca_hndl=%llx mr_hndl=%llx lkey=%x",1708h_ret, e_origmr, shca->ipz_hca_handle.handle,1709e_origmr->ipz_mr_handle.handle,1710e_origmr->ib.ib_mr.lkey);1711return 
ehca2ib_return_code(h_ret);1712}1713/* successful registration */1714e_newmr->num_kpages = e_origmr->num_kpages;1715e_newmr->num_hwpages = e_origmr->num_hwpages;1716e_newmr->hwpage_size = e_origmr->hwpage_size;1717e_newmr->start = iova_start;1718e_newmr->size = e_origmr->size;1719e_newmr->acl = acl;1720e_newmr->ipz_mr_handle = hipzout.handle;1721*lkey = hipzout.lkey;1722*rkey = hipzout.rkey;1723return 0;1724} /* end ehca_reg_maxmr() */17251726/*----------------------------------------------------------------------*/17271728int ehca_dereg_internal_maxmr(struct ehca_shca *shca)1729{1730int ret;1731struct ehca_mr *e_maxmr;1732struct ib_pd *ib_pd;17331734if (!shca->maxmr) {1735ehca_err(&shca->ib_device, "bad call, shca=%p", shca);1736ret = -EINVAL;1737goto ehca_dereg_internal_maxmr_exit0;1738}17391740e_maxmr = shca->maxmr;1741ib_pd = e_maxmr->ib.ib_mr.pd;1742shca->maxmr = NULL; /* remove internal max-MR indication from SHCA */17431744ret = ehca_dereg_mr(&e_maxmr->ib.ib_mr);1745if (ret) {1746ehca_err(&shca->ib_device, "dereg internal max-MR failed, "1747"ret=%i e_maxmr=%p shca=%p lkey=%x",1748ret, e_maxmr, shca, e_maxmr->ib.ib_mr.lkey);1749shca->maxmr = e_maxmr;1750goto ehca_dereg_internal_maxmr_exit0;1751}17521753atomic_dec(&ib_pd->usecnt);17541755ehca_dereg_internal_maxmr_exit0:1756if (ret)1757ehca_err(&shca->ib_device, "ret=%i shca=%p shca->maxmr=%p",1758ret, shca, shca->maxmr);1759return ret;1760} /* end ehca_dereg_internal_maxmr() */17611762/*----------------------------------------------------------------------*/17631764/*1765* check physical buffer array of MR verbs for validness and1766* calculates MR size1767*/1768int ehca_mr_chk_buf_and_calc_size(struct ib_phys_buf *phys_buf_array,1769int num_phys_buf,1770u64 *iova_start,1771u64 *size)1772{1773struct ib_phys_buf *pbuf = phys_buf_array;1774u64 size_count = 0;1775u32 i;17761777if (num_phys_buf == 0) {1778ehca_gen_err("bad phys buf array len, num_phys_buf=0");1779return -EINVAL;1780}1781/* check first buffer 
*/1782if (((u64)iova_start & ~PAGE_MASK) != (pbuf->addr & ~PAGE_MASK)) {1783ehca_gen_err("iova_start/addr mismatch, iova_start=%p "1784"pbuf->addr=%llx pbuf->size=%llx",1785iova_start, pbuf->addr, pbuf->size);1786return -EINVAL;1787}1788if (((pbuf->addr + pbuf->size) % PAGE_SIZE) &&1789(num_phys_buf > 1)) {1790ehca_gen_err("addr/size mismatch in 1st buf, pbuf->addr=%llx "1791"pbuf->size=%llx", pbuf->addr, pbuf->size);1792return -EINVAL;1793}17941795for (i = 0; i < num_phys_buf; i++) {1796if ((i > 0) && (pbuf->addr % PAGE_SIZE)) {1797ehca_gen_err("bad address, i=%x pbuf->addr=%llx "1798"pbuf->size=%llx",1799i, pbuf->addr, pbuf->size);1800return -EINVAL;1801}1802if (((i > 0) && /* not 1st */1803(i < (num_phys_buf - 1)) && /* not last */1804(pbuf->size % PAGE_SIZE)) || (pbuf->size == 0)) {1805ehca_gen_err("bad size, i=%x pbuf->size=%llx",1806i, pbuf->size);1807return -EINVAL;1808}1809size_count += pbuf->size;1810pbuf++;1811}18121813*size = size_count;1814return 0;1815} /* end ehca_mr_chk_buf_and_calc_size() */18161817/*----------------------------------------------------------------------*/18181819/* check page list of map FMR verb for validness */1820int ehca_fmr_check_page_list(struct ehca_mr *e_fmr,1821u64 *page_list,1822int list_len)1823{1824u32 i;1825u64 *page;18261827if ((list_len == 0) || (list_len > e_fmr->fmr_max_pages)) {1828ehca_gen_err("bad list_len, list_len=%x "1829"e_fmr->fmr_max_pages=%x fmr=%p",1830list_len, e_fmr->fmr_max_pages, e_fmr);1831return -EINVAL;1832}18331834/* each page must be aligned */1835page = page_list;1836for (i = 0; i < list_len; i++) {1837if (*page % e_fmr->fmr_page_size) {1838ehca_gen_err("bad page, i=%x *page=%llx page=%p fmr=%p "1839"fmr_page_size=%x", i, *page, page, e_fmr,1840e_fmr->fmr_page_size);1841return -EINVAL;1842}1843page++;1844}18451846return 0;1847} /* end ehca_fmr_check_page_list() */18481849/*----------------------------------------------------------------------*/18501851/* PAGE_SIZE >= pginfo->hwpage_size 
*/1852static int ehca_set_pagebuf_user1(struct ehca_mr_pginfo *pginfo,1853u32 number,1854u64 *kpage)1855{1856int ret = 0;1857struct ib_umem_chunk *prev_chunk;1858struct ib_umem_chunk *chunk;1859u64 pgaddr;1860u32 i = 0;1861u32 j = 0;1862int hwpages_per_kpage = PAGE_SIZE / pginfo->hwpage_size;18631864/* loop over desired chunk entries */1865chunk = pginfo->u.usr.next_chunk;1866prev_chunk = pginfo->u.usr.next_chunk;1867list_for_each_entry_continue(1868chunk, (&(pginfo->u.usr.region->chunk_list)), list) {1869for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {1870pgaddr = page_to_pfn(sg_page(&chunk->page_list[i]))1871<< PAGE_SHIFT ;1872*kpage = phys_to_abs(pgaddr +1873(pginfo->next_hwpage *1874pginfo->hwpage_size));1875if ( !(*kpage) ) {1876ehca_gen_err("pgaddr=%llx "1877"chunk->page_list[i]=%llx "1878"i=%x next_hwpage=%llx",1879pgaddr, (u64)sg_dma_address(1880&chunk->page_list[i]),1881i, pginfo->next_hwpage);1882return -EFAULT;1883}1884(pginfo->hwpage_cnt)++;1885(pginfo->next_hwpage)++;1886kpage++;1887if (pginfo->next_hwpage % hwpages_per_kpage == 0) {1888(pginfo->kpage_cnt)++;1889(pginfo->u.usr.next_nmap)++;1890pginfo->next_hwpage = 0;1891i++;1892}1893j++;1894if (j >= number) break;1895}1896if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&1897(j >= number)) {1898pginfo->u.usr.next_nmap = 0;1899prev_chunk = chunk;1900break;1901} else if (pginfo->u.usr.next_nmap >= chunk->nmap) {1902pginfo->u.usr.next_nmap = 0;1903prev_chunk = chunk;1904} else if (j >= number)1905break;1906else1907prev_chunk = chunk;1908}1909pginfo->u.usr.next_chunk =1910list_prepare_entry(prev_chunk,1911(&(pginfo->u.usr.region->chunk_list)),1912list);1913return ret;1914}19151916/*1917* check given pages for contiguous layout1918* last page addr is returned in prev_pgaddr for further check1919*/1920static int ehca_check_kpages_per_ate(struct scatterlist *page_list,1921int start_idx, int end_idx,1922u64 *prev_pgaddr)1923{1924int t;1925for (t = start_idx; t <= end_idx; t++) {1926u64 pgaddr = 
page_to_pfn(sg_page(&page_list[t])) << PAGE_SHIFT;1927if (ehca_debug_level >= 3)1928ehca_gen_dbg("chunk_page=%llx value=%016llx", pgaddr,1929*(u64 *)abs_to_virt(phys_to_abs(pgaddr)));1930if (pgaddr - PAGE_SIZE != *prev_pgaddr) {1931ehca_gen_err("uncontiguous page found pgaddr=%llx "1932"prev_pgaddr=%llx page_list_i=%x",1933pgaddr, *prev_pgaddr, t);1934return -EINVAL;1935}1936*prev_pgaddr = pgaddr;1937}1938return 0;1939}19401941/* PAGE_SIZE < pginfo->hwpage_size */1942static int ehca_set_pagebuf_user2(struct ehca_mr_pginfo *pginfo,1943u32 number,1944u64 *kpage)1945{1946int ret = 0;1947struct ib_umem_chunk *prev_chunk;1948struct ib_umem_chunk *chunk;1949u64 pgaddr, prev_pgaddr;1950u32 i = 0;1951u32 j = 0;1952int kpages_per_hwpage = pginfo->hwpage_size / PAGE_SIZE;1953int nr_kpages = kpages_per_hwpage;19541955/* loop over desired chunk entries */1956chunk = pginfo->u.usr.next_chunk;1957prev_chunk = pginfo->u.usr.next_chunk;1958list_for_each_entry_continue(1959chunk, (&(pginfo->u.usr.region->chunk_list)), list) {1960for (i = pginfo->u.usr.next_nmap; i < chunk->nmap; ) {1961if (nr_kpages == kpages_per_hwpage) {1962pgaddr = ( page_to_pfn(sg_page(&chunk->page_list[i]))1963<< PAGE_SHIFT );1964*kpage = phys_to_abs(pgaddr);1965if ( !(*kpage) ) {1966ehca_gen_err("pgaddr=%llx i=%x",1967pgaddr, i);1968ret = -EFAULT;1969return ret;1970}1971/*1972* The first page in a hwpage must be aligned;1973* the first MR page is exempt from this rule.1974*/1975if (pgaddr & (pginfo->hwpage_size - 1)) {1976if (pginfo->hwpage_cnt) {1977ehca_gen_err(1978"invalid alignment "1979"pgaddr=%llx i=%x "1980"mr_pgsize=%llx",1981pgaddr, i,1982pginfo->hwpage_size);1983ret = -EFAULT;1984return ret;1985}1986/* first MR page */1987pginfo->kpage_cnt =1988(pgaddr &1989(pginfo->hwpage_size - 1)) >>1990PAGE_SHIFT;1991nr_kpages -= pginfo->kpage_cnt;1992*kpage = phys_to_abs(1993pgaddr &1994~(pginfo->hwpage_size - 1));1995}1996if (ehca_debug_level >= 3) {1997u64 val = *(u64 
*)abs_to_virt(1998phys_to_abs(pgaddr));1999ehca_gen_dbg("kpage=%llx chunk_page=%llx "2000"value=%016llx",2001*kpage, pgaddr, val);2002}2003prev_pgaddr = pgaddr;2004i++;2005pginfo->kpage_cnt++;2006pginfo->u.usr.next_nmap++;2007nr_kpages--;2008if (!nr_kpages)2009goto next_kpage;2010continue;2011}2012if (i + nr_kpages > chunk->nmap) {2013ret = ehca_check_kpages_per_ate(2014chunk->page_list, i,2015chunk->nmap - 1, &prev_pgaddr);2016if (ret) return ret;2017pginfo->kpage_cnt += chunk->nmap - i;2018pginfo->u.usr.next_nmap += chunk->nmap - i;2019nr_kpages -= chunk->nmap - i;2020break;2021}20222023ret = ehca_check_kpages_per_ate(chunk->page_list, i,2024i + nr_kpages - 1,2025&prev_pgaddr);2026if (ret) return ret;2027i += nr_kpages;2028pginfo->kpage_cnt += nr_kpages;2029pginfo->u.usr.next_nmap += nr_kpages;2030next_kpage:2031nr_kpages = kpages_per_hwpage;2032(pginfo->hwpage_cnt)++;2033kpage++;2034j++;2035if (j >= number) break;2036}2037if ((pginfo->u.usr.next_nmap >= chunk->nmap) &&2038(j >= number)) {2039pginfo->u.usr.next_nmap = 0;2040prev_chunk = chunk;2041break;2042} else if (pginfo->u.usr.next_nmap >= chunk->nmap) {2043pginfo->u.usr.next_nmap = 0;2044prev_chunk = chunk;2045} else if (j >= number)2046break;2047else2048prev_chunk = chunk;2049}2050pginfo->u.usr.next_chunk =2051list_prepare_entry(prev_chunk,2052(&(pginfo->u.usr.region->chunk_list)),2053list);2054return ret;2055}20562057static int ehca_set_pagebuf_phys(struct ehca_mr_pginfo *pginfo,2058u32 number, u64 *kpage)2059{2060int ret = 0;2061struct ib_phys_buf *pbuf;2062u64 num_hw, offs_hw;2063u32 i = 0;20642065/* loop over desired phys_buf_array entries */2066while (i < number) {2067pbuf = pginfo->u.phy.phys_buf_array + pginfo->u.phy.next_buf;2068num_hw = NUM_CHUNKS((pbuf->addr % pginfo->hwpage_size) +2069pbuf->size, pginfo->hwpage_size);2070offs_hw = (pbuf->addr & ~(pginfo->hwpage_size - 1)) /2071pginfo->hwpage_size;2072while (pginfo->next_hwpage < offs_hw + num_hw) {2073/* sanity check */2074if ((pginfo->kpage_cnt 
>= pginfo->num_kpages) ||2075(pginfo->hwpage_cnt >= pginfo->num_hwpages)) {2076ehca_gen_err("kpage_cnt >= num_kpages, "2077"kpage_cnt=%llx num_kpages=%llx "2078"hwpage_cnt=%llx "2079"num_hwpages=%llx i=%x",2080pginfo->kpage_cnt,2081pginfo->num_kpages,2082pginfo->hwpage_cnt,2083pginfo->num_hwpages, i);2084return -EFAULT;2085}2086*kpage = phys_to_abs(2087(pbuf->addr & ~(pginfo->hwpage_size - 1)) +2088(pginfo->next_hwpage * pginfo->hwpage_size));2089if ( !(*kpage) && pbuf->addr ) {2090ehca_gen_err("pbuf->addr=%llx pbuf->size=%llx "2091"next_hwpage=%llx", pbuf->addr,2092pbuf->size, pginfo->next_hwpage);2093return -EFAULT;2094}2095(pginfo->hwpage_cnt)++;2096(pginfo->next_hwpage)++;2097if (PAGE_SIZE >= pginfo->hwpage_size) {2098if (pginfo->next_hwpage %2099(PAGE_SIZE / pginfo->hwpage_size) == 0)2100(pginfo->kpage_cnt)++;2101} else2102pginfo->kpage_cnt += pginfo->hwpage_size /2103PAGE_SIZE;2104kpage++;2105i++;2106if (i >= number) break;2107}2108if (pginfo->next_hwpage >= offs_hw + num_hw) {2109(pginfo->u.phy.next_buf)++;2110pginfo->next_hwpage = 0;2111}2112}2113return ret;2114}21152116static int ehca_set_pagebuf_fmr(struct ehca_mr_pginfo *pginfo,2117u32 number, u64 *kpage)2118{2119int ret = 0;2120u64 *fmrlist;2121u32 i;21222123/* loop over desired page_list entries */2124fmrlist = pginfo->u.fmr.page_list + pginfo->u.fmr.next_listelem;2125for (i = 0; i < number; i++) {2126*kpage = phys_to_abs((*fmrlist & ~(pginfo->hwpage_size - 1)) +2127pginfo->next_hwpage * pginfo->hwpage_size);2128if ( !(*kpage) ) {2129ehca_gen_err("*fmrlist=%llx fmrlist=%p "2130"next_listelem=%llx next_hwpage=%llx",2131*fmrlist, fmrlist,2132pginfo->u.fmr.next_listelem,2133pginfo->next_hwpage);2134return -EFAULT;2135}2136(pginfo->hwpage_cnt)++;2137if (pginfo->u.fmr.fmr_pgsize >= pginfo->hwpage_size) {2138if (pginfo->next_hwpage %2139(pginfo->u.fmr.fmr_pgsize /2140pginfo->hwpage_size) == 0) {2141(pginfo->kpage_cnt)++;2142(pginfo->u.fmr.next_listelem)++;2143fmrlist++;2144pginfo->next_hwpage = 0;2145} 
else2146(pginfo->next_hwpage)++;2147} else {2148unsigned int cnt_per_hwpage = pginfo->hwpage_size /2149pginfo->u.fmr.fmr_pgsize;2150unsigned int j;2151u64 prev = *kpage;2152/* check if adrs are contiguous */2153for (j = 1; j < cnt_per_hwpage; j++) {2154u64 p = phys_to_abs(fmrlist[j] &2155~(pginfo->hwpage_size - 1));2156if (prev + pginfo->u.fmr.fmr_pgsize != p) {2157ehca_gen_err("uncontiguous fmr pages "2158"found prev=%llx p=%llx "2159"idx=%x", prev, p, i + j);2160return -EINVAL;2161}2162prev = p;2163}2164pginfo->kpage_cnt += cnt_per_hwpage;2165pginfo->u.fmr.next_listelem += cnt_per_hwpage;2166fmrlist += cnt_per_hwpage;2167}2168kpage++;2169}2170return ret;2171}21722173/* setup page buffer from page info */2174int ehca_set_pagebuf(struct ehca_mr_pginfo *pginfo,2175u32 number,2176u64 *kpage)2177{2178int ret;21792180switch (pginfo->type) {2181case EHCA_MR_PGI_PHYS:2182ret = ehca_set_pagebuf_phys(pginfo, number, kpage);2183break;2184case EHCA_MR_PGI_USER:2185ret = PAGE_SIZE >= pginfo->hwpage_size ?2186ehca_set_pagebuf_user1(pginfo, number, kpage) :2187ehca_set_pagebuf_user2(pginfo, number, kpage);2188break;2189case EHCA_MR_PGI_FMR:2190ret = ehca_set_pagebuf_fmr(pginfo, number, kpage);2191break;2192default:2193ehca_gen_err("bad pginfo->type=%x", pginfo->type);2194ret = -EFAULT;2195break;2196}2197return ret;2198} /* end ehca_set_pagebuf() */21992200/*----------------------------------------------------------------------*/22012202/*2203* check MR if it is a max-MR, i.e. 
uses whole memory2204* in case it's a max-MR 1 is returned, else 02205*/2206int ehca_mr_is_maxmr(u64 size,2207u64 *iova_start)2208{2209/* a MR is treated as max-MR only if it fits following: */2210if ((size == ehca_mr_len) &&2211(iova_start == (void *)ehca_map_vaddr((void *)(KERNELBASE + PHYSICAL_START)))) {2212ehca_gen_dbg("this is a max-MR");2213return 1;2214} else2215return 0;2216} /* end ehca_mr_is_maxmr() */22172218/*----------------------------------------------------------------------*/22192220/* map access control for MR/MW. This routine is used for MR and MW. */2221void ehca_mrmw_map_acl(int ib_acl,2222u32 *hipz_acl)2223{2224*hipz_acl = 0;2225if (ib_acl & IB_ACCESS_REMOTE_READ)2226*hipz_acl |= HIPZ_ACCESSCTRL_R_READ;2227if (ib_acl & IB_ACCESS_REMOTE_WRITE)2228*hipz_acl |= HIPZ_ACCESSCTRL_R_WRITE;2229if (ib_acl & IB_ACCESS_REMOTE_ATOMIC)2230*hipz_acl |= HIPZ_ACCESSCTRL_R_ATOMIC;2231if (ib_acl & IB_ACCESS_LOCAL_WRITE)2232*hipz_acl |= HIPZ_ACCESSCTRL_L_WRITE;2233if (ib_acl & IB_ACCESS_MW_BIND)2234*hipz_acl |= HIPZ_ACCESSCTRL_MW_BIND;2235} /* end ehca_mrmw_map_acl() */22362237/*----------------------------------------------------------------------*/22382239/* sets page size in hipz access control for MR/MW. 
*/2240void ehca_mrmw_set_pgsize_hipz_acl(u32 pgsize, u32 *hipz_acl) /*INOUT*/2241{2242*hipz_acl |= (ehca_encode_hwpage_size(pgsize) << 24);2243} /* end ehca_mrmw_set_pgsize_hipz_acl() */22442245/*----------------------------------------------------------------------*/22462247/*2248* reverse map access control for MR/MW.2249* This routine is used for MR and MW.2250*/2251void ehca_mrmw_reverse_map_acl(const u32 *hipz_acl,2252int *ib_acl) /*OUT*/2253{2254*ib_acl = 0;2255if (*hipz_acl & HIPZ_ACCESSCTRL_R_READ)2256*ib_acl |= IB_ACCESS_REMOTE_READ;2257if (*hipz_acl & HIPZ_ACCESSCTRL_R_WRITE)2258*ib_acl |= IB_ACCESS_REMOTE_WRITE;2259if (*hipz_acl & HIPZ_ACCESSCTRL_R_ATOMIC)2260*ib_acl |= IB_ACCESS_REMOTE_ATOMIC;2261if (*hipz_acl & HIPZ_ACCESSCTRL_L_WRITE)2262*ib_acl |= IB_ACCESS_LOCAL_WRITE;2263if (*hipz_acl & HIPZ_ACCESSCTRL_MW_BIND)2264*ib_acl |= IB_ACCESS_MW_BIND;2265} /* end ehca_mrmw_reverse_map_acl() */226622672268/*----------------------------------------------------------------------*/22692270/*2271* MR destructor and constructor2272* used in Reregister MR verb, sets all fields in ehca_mr_t to 0,2273* except struct ib_mr and spinlock2274*/2275void ehca_mr_deletenew(struct ehca_mr *mr)2276{2277mr->flags = 0;2278mr->num_kpages = 0;2279mr->num_hwpages = 0;2280mr->acl = 0;2281mr->start = NULL;2282mr->fmr_page_size = 0;2283mr->fmr_max_pages = 0;2284mr->fmr_max_maps = 0;2285mr->fmr_map_cnt = 0;2286memset(&mr->ipz_mr_handle, 0, sizeof(mr->ipz_mr_handle));2287memset(&mr->galpas, 0, sizeof(mr->galpas));2288} /* end ehca_mr_deletenew() */22892290int ehca_init_mrmw_cache(void)2291{2292mr_cache = kmem_cache_create("ehca_cache_mr",2293sizeof(struct ehca_mr), 0,2294SLAB_HWCACHE_ALIGN,2295NULL);2296if (!mr_cache)2297return -ENOMEM;2298mw_cache = kmem_cache_create("ehca_cache_mw",2299sizeof(struct ehca_mw), 0,2300SLAB_HWCACHE_ALIGN,2301NULL);2302if (!mw_cache) {2303kmem_cache_destroy(mr_cache);2304mr_cache = NULL;2305return -ENOMEM;2306}2307return 0;2308}23092310void 
ehca_cleanup_mrmw_cache(void)2311{2312if (mr_cache)2313kmem_cache_destroy(mr_cache);2314if (mw_cache)2315kmem_cache_destroy(mw_cache);2316}23172318static inline int ehca_init_top_bmap(struct ehca_top_bmap *ehca_top_bmap,2319int dir)2320{2321if (!ehca_bmap_valid(ehca_top_bmap->dir[dir])) {2322ehca_top_bmap->dir[dir] =2323kmalloc(sizeof(struct ehca_dir_bmap), GFP_KERNEL);2324if (!ehca_top_bmap->dir[dir])2325return -ENOMEM;2326/* Set map block to 0xFF according to EHCA_INVAL_ADDR */2327memset(ehca_top_bmap->dir[dir], 0xFF, EHCA_ENT_MAP_SIZE);2328}2329return 0;2330}23312332static inline int ehca_init_bmap(struct ehca_bmap *ehca_bmap, int top, int dir)2333{2334if (!ehca_bmap_valid(ehca_bmap->top[top])) {2335ehca_bmap->top[top] =2336kmalloc(sizeof(struct ehca_top_bmap), GFP_KERNEL);2337if (!ehca_bmap->top[top])2338return -ENOMEM;2339/* Set map block to 0xFF according to EHCA_INVAL_ADDR */2340memset(ehca_bmap->top[top], 0xFF, EHCA_DIR_MAP_SIZE);2341}2342return ehca_init_top_bmap(ehca_bmap->top[top], dir);2343}23442345static inline int ehca_calc_index(unsigned long i, unsigned long s)2346{2347return (i >> s) & EHCA_INDEX_MASK;2348}23492350void ehca_destroy_busmap(void)2351{2352int top, dir;23532354if (!ehca_bmap)2355return;23562357for (top = 0; top < EHCA_MAP_ENTRIES; top++) {2358if (!ehca_bmap_valid(ehca_bmap->top[top]))2359continue;2360for (dir = 0; dir < EHCA_MAP_ENTRIES; dir++) {2361if (!ehca_bmap_valid(ehca_bmap->top[top]->dir[dir]))2362continue;23632364kfree(ehca_bmap->top[top]->dir[dir]);2365}23662367kfree(ehca_bmap->top[top]);2368}23692370kfree(ehca_bmap);2371ehca_bmap = NULL;2372}23732374static int ehca_update_busmap(unsigned long pfn, unsigned long nr_pages)2375{2376unsigned long i, start_section, end_section;2377int top, dir, idx;23782379if (!nr_pages)2380return 0;23812382if (!ehca_bmap) {2383ehca_bmap = kmalloc(sizeof(struct ehca_bmap), GFP_KERNEL);2384if (!ehca_bmap)2385return -ENOMEM;2386/* Set map block to 0xFF according to EHCA_INVAL_ADDR 
*/2387memset(ehca_bmap, 0xFF, EHCA_TOP_MAP_SIZE);2388}23892390start_section = phys_to_abs(pfn * PAGE_SIZE) / EHCA_SECTSIZE;2391end_section = phys_to_abs((pfn + nr_pages) * PAGE_SIZE) / EHCA_SECTSIZE;2392for (i = start_section; i < end_section; i++) {2393int ret;2394top = ehca_calc_index(i, EHCA_TOP_INDEX_SHIFT);2395dir = ehca_calc_index(i, EHCA_DIR_INDEX_SHIFT);2396idx = i & EHCA_INDEX_MASK;23972398ret = ehca_init_bmap(ehca_bmap, top, dir);2399if (ret) {2400ehca_destroy_busmap();2401return ret;2402}2403ehca_bmap->top[top]->dir[dir]->ent[idx] = ehca_mr_len;2404ehca_mr_len += EHCA_SECTSIZE;2405}2406return 0;2407}24082409static int ehca_is_hugepage(unsigned long pfn)2410{2411int page_order;24122413if (pfn & EHCA_HUGEPAGE_PFN_MASK)2414return 0;24152416page_order = compound_order(pfn_to_page(pfn));2417if (page_order + PAGE_SHIFT != EHCA_HUGEPAGESHIFT)2418return 0;24192420return 1;2421}24222423static int ehca_create_busmap_callback(unsigned long initial_pfn,2424unsigned long total_nr_pages, void *arg)2425{2426int ret;2427unsigned long pfn, start_pfn, end_pfn, nr_pages;24282429if ((total_nr_pages * PAGE_SIZE) < EHCA_HUGEPAGE_SIZE)2430return ehca_update_busmap(initial_pfn, total_nr_pages);24312432/* Given chunk is >= 16GB -> check for hugepages */2433start_pfn = initial_pfn;2434end_pfn = initial_pfn + total_nr_pages;2435pfn = start_pfn;24362437while (pfn < end_pfn) {2438if (ehca_is_hugepage(pfn)) {2439/* Add mem found in front of the hugepage */2440nr_pages = pfn - start_pfn;2441ret = ehca_update_busmap(start_pfn, nr_pages);2442if (ret)2443return ret;2444/* Skip the hugepage */2445pfn += (EHCA_HUGEPAGE_SIZE / PAGE_SIZE);2446start_pfn = pfn;2447} else2448pfn += (EHCA_SECTSIZE / PAGE_SIZE);2449}24502451/* Add mem found behind the hugepage(s) */2452nr_pages = pfn - start_pfn;2453return ehca_update_busmap(start_pfn, nr_pages);2454}24552456int ehca_create_busmap(void)2457{2458int ret;24592460ehca_mr_len = 0;2461ret = walk_system_ram_range(0, 1ULL << MAX_PHYSMEM_BITS, 
NULL,2462ehca_create_busmap_callback);2463return ret;2464}24652466static int ehca_reg_bmap_mr_rpages(struct ehca_shca *shca,2467struct ehca_mr *e_mr,2468struct ehca_mr_pginfo *pginfo)2469{2470int top;2471u64 hret, *kpage;24722473kpage = ehca_alloc_fw_ctrlblock(GFP_KERNEL);2474if (!kpage) {2475ehca_err(&shca->ib_device, "kpage alloc failed");2476return -ENOMEM;2477}2478for (top = 0; top < EHCA_MAP_ENTRIES; top++) {2479if (!ehca_bmap_valid(ehca_bmap->top[top]))2480continue;2481hret = ehca_reg_mr_dir_sections(top, kpage, shca, e_mr, pginfo);2482if ((hret != H_PAGE_REGISTERED) && (hret != H_SUCCESS))2483break;2484}24852486ehca_free_fw_ctrlblock(kpage);24872488if (hret == H_SUCCESS)2489return 0; /* Everything is fine */2490else {2491ehca_err(&shca->ib_device, "ehca_reg_bmap_mr_rpages failed, "2492"h_ret=%lli e_mr=%p top=%x lkey=%x "2493"hca_hndl=%llx mr_hndl=%llx", hret, e_mr, top,2494e_mr->ib.ib_mr.lkey,2495shca->ipz_hca_handle.handle,2496e_mr->ipz_mr_handle.handle);2497return ehca2ib_return_code(hret);2498}2499}25002501static u64 ehca_map_vaddr(void *caddr)2502{2503int top, dir, idx;2504unsigned long abs_addr, offset;2505u64 entry;25062507if (!ehca_bmap)2508return EHCA_INVAL_ADDR;25092510abs_addr = virt_to_abs(caddr);2511top = ehca_calc_index(abs_addr, EHCA_TOP_INDEX_SHIFT + EHCA_SECTSHIFT);2512if (!ehca_bmap_valid(ehca_bmap->top[top]))2513return EHCA_INVAL_ADDR;25142515dir = ehca_calc_index(abs_addr, EHCA_DIR_INDEX_SHIFT + EHCA_SECTSHIFT);2516if (!ehca_bmap_valid(ehca_bmap->top[top]->dir[dir]))2517return EHCA_INVAL_ADDR;25182519idx = ehca_calc_index(abs_addr, EHCA_SECTSHIFT);25202521entry = ehca_bmap->top[top]->dir[dir]->ent[idx];2522if (ehca_bmap_valid(entry)) {2523offset = (unsigned long)caddr & (EHCA_SECTSIZE - 1);2524return entry | offset;2525} else2526return EHCA_INVAL_ADDR;2527}25282529static int ehca_dma_mapping_error(struct ib_device *dev, u64 dma_addr)2530{2531return dma_addr == EHCA_INVAL_ADDR;2532}25332534static u64 ehca_dma_map_single(struct ib_device 
*dev, void *cpu_addr,2535size_t size, enum dma_data_direction direction)2536{2537if (cpu_addr)2538return ehca_map_vaddr(cpu_addr);2539else2540return EHCA_INVAL_ADDR;2541}25422543static void ehca_dma_unmap_single(struct ib_device *dev, u64 addr, size_t size,2544enum dma_data_direction direction)2545{2546/* This is only a stub; nothing to be done here */2547}25482549static u64 ehca_dma_map_page(struct ib_device *dev, struct page *page,2550unsigned long offset, size_t size,2551enum dma_data_direction direction)2552{2553u64 addr;25542555if (offset + size > PAGE_SIZE)2556return EHCA_INVAL_ADDR;25572558addr = ehca_map_vaddr(page_address(page));2559if (!ehca_dma_mapping_error(dev, addr))2560addr += offset;25612562return addr;2563}25642565static void ehca_dma_unmap_page(struct ib_device *dev, u64 addr, size_t size,2566enum dma_data_direction direction)2567{2568/* This is only a stub; nothing to be done here */2569}25702571static int ehca_dma_map_sg(struct ib_device *dev, struct scatterlist *sgl,2572int nents, enum dma_data_direction direction)2573{2574struct scatterlist *sg;2575int i;25762577for_each_sg(sgl, sg, nents, i) {2578u64 addr;2579addr = ehca_map_vaddr(sg_virt(sg));2580if (ehca_dma_mapping_error(dev, addr))2581return 0;25822583sg->dma_address = addr;2584sg->dma_length = sg->length;2585}2586return nents;2587}25882589static void ehca_dma_unmap_sg(struct ib_device *dev, struct scatterlist *sg,2590int nents, enum dma_data_direction direction)2591{2592/* This is only a stub; nothing to be done here */2593}25942595static u64 ehca_dma_address(struct ib_device *dev, struct scatterlist *sg)2596{2597return sg->dma_address;2598}25992600static unsigned int ehca_dma_len(struct ib_device *dev, struct scatterlist *sg)2601{2602return sg->length;2603}26042605static void ehca_dma_sync_single_for_cpu(struct ib_device *dev, u64 addr,2606size_t size,2607enum dma_data_direction dir)2608{2609dma_sync_single_for_cpu(dev->dma_device, addr, size, dir);2610}26112612static void 
ehca_dma_sync_single_for_device(struct ib_device *dev, u64 addr,2613size_t size,2614enum dma_data_direction dir)2615{2616dma_sync_single_for_device(dev->dma_device, addr, size, dir);2617}26182619static void *ehca_dma_alloc_coherent(struct ib_device *dev, size_t size,2620u64 *dma_handle, gfp_t flag)2621{2622struct page *p;2623void *addr = NULL;2624u64 dma_addr;26252626p = alloc_pages(flag, get_order(size));2627if (p) {2628addr = page_address(p);2629dma_addr = ehca_map_vaddr(addr);2630if (ehca_dma_mapping_error(dev, dma_addr)) {2631free_pages((unsigned long)addr, get_order(size));2632return NULL;2633}2634if (dma_handle)2635*dma_handle = dma_addr;2636return addr;2637}2638return NULL;2639}26402641static void ehca_dma_free_coherent(struct ib_device *dev, size_t size,2642void *cpu_addr, u64 dma_handle)2643{2644if (cpu_addr && size)2645free_pages((unsigned long)cpu_addr, get_order(size));2646}264726482649struct ib_dma_mapping_ops ehca_dma_mapping_ops = {2650.mapping_error = ehca_dma_mapping_error,2651.map_single = ehca_dma_map_single,2652.unmap_single = ehca_dma_unmap_single,2653.map_page = ehca_dma_map_page,2654.unmap_page = ehca_dma_unmap_page,2655.map_sg = ehca_dma_map_sg,2656.unmap_sg = ehca_dma_unmap_sg,2657.dma_address = ehca_dma_address,2658.dma_len = ehca_dma_len,2659.sync_single_for_cpu = ehca_dma_sync_single_for_cpu,2660.sync_single_for_device = ehca_dma_sync_single_for_device,2661.alloc_coherent = ehca_dma_alloc_coherent,2662.free_coherent = ehca_dma_free_coherent,2663};266426652666