1eb3ae0aaSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only 267f4addbSFrank Haverkamp /** 367f4addbSFrank Haverkamp * IBM Accelerator Family 'GenWQE' 467f4addbSFrank Haverkamp * 567f4addbSFrank Haverkamp * (C) Copyright IBM Corp. 2013 667f4addbSFrank Haverkamp * 767f4addbSFrank Haverkamp * Author: Frank Haverkamp <haver@linux.vnet.ibm.com> 867f4addbSFrank Haverkamp * Author: Joerg-Stephan Vogt <jsvogt@de.ibm.com> 926d8f6f1SFrank Haverkamp * Author: Michael Jung <mijung@gmx.net> 1067f4addbSFrank Haverkamp * Author: Michael Ruettger <michael@ibmra.de> 1167f4addbSFrank Haverkamp */ 1267f4addbSFrank Haverkamp 1367f4addbSFrank Haverkamp /* 1467f4addbSFrank Haverkamp * Miscelanous functionality used in the other GenWQE driver parts. 1567f4addbSFrank Haverkamp */ 1667f4addbSFrank Haverkamp 1767f4addbSFrank Haverkamp #include <linux/kernel.h> 1867f4addbSFrank Haverkamp #include <linux/sched.h> 1967f4addbSFrank Haverkamp #include <linux/vmalloc.h> 2067f4addbSFrank Haverkamp #include <linux/page-flags.h> 2167f4addbSFrank Haverkamp #include <linux/scatterlist.h> 2267f4addbSFrank Haverkamp #include <linux/hugetlb.h> 2367f4addbSFrank Haverkamp #include <linux/iommu.h> 2467f4addbSFrank Haverkamp #include <linux/pci.h> 2567f4addbSFrank Haverkamp #include <linux/dma-mapping.h> 2667f4addbSFrank Haverkamp #include <linux/ctype.h> 2767f4addbSFrank Haverkamp #include <linux/module.h> 2867f4addbSFrank Haverkamp #include <linux/platform_device.h> 2967f4addbSFrank Haverkamp #include <linux/delay.h> 3067f4addbSFrank Haverkamp #include <asm/pgtable.h> 3167f4addbSFrank Haverkamp 3267f4addbSFrank Haverkamp #include "genwqe_driver.h" 3367f4addbSFrank Haverkamp #include "card_base.h" 3467f4addbSFrank Haverkamp #include "card_ddcb.h" 3567f4addbSFrank Haverkamp 3667f4addbSFrank Haverkamp /** 3767f4addbSFrank Haverkamp * __genwqe_writeq() - Write 64-bit register 3867f4addbSFrank Haverkamp * @cd: genwqe device descriptor 3967f4addbSFrank Haverkamp * @byte_offs: byte offset within BAR 4067f4addbSFrank Haverkamp * @val: 64-bit value 4167f4addbSFrank Haverkamp * 4267f4addbSFrank Haverkamp * Return: 0 if success; < 0 if error 4367f4addbSFrank Haverkamp */ 4467f4addbSFrank Haverkamp int __genwqe_writeq(struct genwqe_dev *cd, u64 byte_offs, u64 val) 4567f4addbSFrank Haverkamp { 46fb145456SKleber Sacilotto de Souza struct pci_dev *pci_dev = cd->pci_dev; 47fb145456SKleber Sacilotto de Souza 4867f4addbSFrank Haverkamp if (cd->err_inject & GENWQE_INJECT_HARDWARE_FAILURE) 4967f4addbSFrank Haverkamp return -EIO; 5067f4addbSFrank Haverkamp 5167f4addbSFrank Haverkamp if (cd->mmio == NULL) 5267f4addbSFrank Haverkamp return -EIO; 5367f4addbSFrank Haverkamp 54fb145456SKleber Sacilotto de Souza if (pci_channel_offline(pci_dev)) 55fb145456SKleber Sacilotto de Souza return -EIO; 56fb145456SKleber Sacilotto de Souza 57a45a0258SFrank Haverkamp __raw_writeq((__force u64)cpu_to_be64(val), cd->mmio + byte_offs); 5867f4addbSFrank Haverkamp return 0; 5967f4addbSFrank Haverkamp } 6067f4addbSFrank Haverkamp 6167f4addbSFrank Haverkamp /** 6267f4addbSFrank Haverkamp * __genwqe_readq() - Read 64-bit register 6367f4addbSFrank Haverkamp * @cd: genwqe device descriptor 6467f4addbSFrank Haverkamp * @byte_offs: offset within BAR 6567f4addbSFrank Haverkamp * 6667f4addbSFrank Haverkamp * Return: value from register 6767f4addbSFrank Haverkamp */ 6867f4addbSFrank Haverkamp u64 __genwqe_readq(struct genwqe_dev *cd, u64 byte_offs) 6967f4addbSFrank Haverkamp { 7067f4addbSFrank Haverkamp if (cd->err_inject & GENWQE_INJECT_HARDWARE_FAILURE) 7167f4addbSFrank Haverkamp return 0xffffffffffffffffull; 7267f4addbSFrank Haverkamp 7367f4addbSFrank Haverkamp if ((cd->err_inject & GENWQE_INJECT_GFIR_FATAL) && 7467f4addbSFrank Haverkamp (byte_offs == IO_SLC_CFGREG_GFIR)) 7567f4addbSFrank Haverkamp return 0x000000000000ffffull; 7667f4addbSFrank Haverkamp 7767f4addbSFrank Haverkamp if ((cd->err_inject & GENWQE_INJECT_GFIR_INFO) && 7867f4addbSFrank Haverkamp (byte_offs == IO_SLC_CFGREG_GFIR)) 7967f4addbSFrank Haverkamp return 0x00000000ffff0000ull; 8067f4addbSFrank Haverkamp 8167f4addbSFrank Haverkamp if (cd->mmio == NULL) 8267f4addbSFrank Haverkamp return 0xffffffffffffffffull; 8367f4addbSFrank Haverkamp 8458d66ce7SFrank Haverkamp return be64_to_cpu((__force __be64)__raw_readq(cd->mmio + byte_offs)); 8567f4addbSFrank Haverkamp } 8667f4addbSFrank Haverkamp 8767f4addbSFrank Haverkamp /** 8867f4addbSFrank Haverkamp * __genwqe_writel() - Write 32-bit register 8967f4addbSFrank Haverkamp * @cd: genwqe device descriptor 9067f4addbSFrank Haverkamp * @byte_offs: byte offset within BAR 9167f4addbSFrank Haverkamp * @val: 32-bit value 9267f4addbSFrank Haverkamp * 9367f4addbSFrank Haverkamp * Return: 0 if success; < 0 if error 9467f4addbSFrank Haverkamp */ 9567f4addbSFrank Haverkamp int __genwqe_writel(struct genwqe_dev *cd, u64 byte_offs, u32 val) 9667f4addbSFrank Haverkamp { 97fb145456SKleber Sacilotto de Souza struct pci_dev *pci_dev = cd->pci_dev; 98fb145456SKleber Sacilotto de Souza 9967f4addbSFrank Haverkamp if (cd->err_inject & GENWQE_INJECT_HARDWARE_FAILURE) 10067f4addbSFrank Haverkamp return -EIO; 10167f4addbSFrank Haverkamp 10267f4addbSFrank Haverkamp if (cd->mmio == NULL) 10367f4addbSFrank Haverkamp return -EIO; 10467f4addbSFrank Haverkamp 105fb145456SKleber Sacilotto de Souza if (pci_channel_offline(pci_dev)) 106fb145456SKleber Sacilotto de Souza return -EIO; 107fb145456SKleber Sacilotto de Souza 10858d66ce7SFrank Haverkamp __raw_writel((__force u32)cpu_to_be32(val), cd->mmio + byte_offs); 10967f4addbSFrank Haverkamp return 0; 11067f4addbSFrank Haverkamp } 11167f4addbSFrank Haverkamp 11267f4addbSFrank Haverkamp /** 11367f4addbSFrank Haverkamp * __genwqe_readl() - Read 32-bit register 11467f4addbSFrank Haverkamp * @cd: genwqe device descriptor 11567f4addbSFrank Haverkamp * @byte_offs: offset within BAR 11667f4addbSFrank Haverkamp * 11767f4addbSFrank Haverkamp * Return: Value from register 11867f4addbSFrank Haverkamp */ 11967f4addbSFrank Haverkamp u32 __genwqe_readl(struct genwqe_dev *cd, u64 byte_offs) 12067f4addbSFrank Haverkamp { 12167f4addbSFrank Haverkamp if (cd->err_inject & GENWQE_INJECT_HARDWARE_FAILURE) 12267f4addbSFrank Haverkamp return 0xffffffff; 12367f4addbSFrank Haverkamp 12467f4addbSFrank Haverkamp if (cd->mmio == NULL) 12567f4addbSFrank Haverkamp return 0xffffffff; 12667f4addbSFrank Haverkamp 12758d66ce7SFrank Haverkamp return be32_to_cpu((__force __be32)__raw_readl(cd->mmio + byte_offs)); 12867f4addbSFrank Haverkamp } 12967f4addbSFrank Haverkamp 13067f4addbSFrank Haverkamp /** 13167f4addbSFrank Haverkamp * genwqe_read_app_id() - Extract app_id 13267f4addbSFrank Haverkamp * 13367f4addbSFrank Haverkamp * app_unitcfg need to be filled with valid data first 13467f4addbSFrank Haverkamp */ 13567f4addbSFrank Haverkamp int genwqe_read_app_id(struct genwqe_dev *cd, char *app_name, int len) 13667f4addbSFrank Haverkamp { 13767f4addbSFrank Haverkamp int i, j; 13867f4addbSFrank Haverkamp u32 app_id = (u32)cd->app_unitcfg; 13967f4addbSFrank Haverkamp 14067f4addbSFrank Haverkamp memset(app_name, 0, len); 14167f4addbSFrank Haverkamp for (i = 0, j = 0; j < min(len, 4); j++) { 14267f4addbSFrank Haverkamp char ch = (char)((app_id >> (24 - j*8)) & 0xff); 143d9c11d45SFrank Haverkamp 14467f4addbSFrank Haverkamp if (ch == ' ') 14567f4addbSFrank Haverkamp continue; 14667f4addbSFrank Haverkamp app_name[i++] = isprint(ch) ? ch : 'X'; 14767f4addbSFrank Haverkamp } 14867f4addbSFrank Haverkamp return i; 14967f4addbSFrank Haverkamp } 15067f4addbSFrank Haverkamp 15167f4addbSFrank Haverkamp /** 15267f4addbSFrank Haverkamp * genwqe_init_crc32() - Prepare a lookup table for fast crc32 calculations 15367f4addbSFrank Haverkamp * 15467f4addbSFrank Haverkamp * Existing kernel functions seem to use a different polynom, 15567f4addbSFrank Haverkamp * therefore we could not use them here. 15667f4addbSFrank Haverkamp * 15767f4addbSFrank Haverkamp * Genwqe's Polynomial = 0x20044009 15867f4addbSFrank Haverkamp */ 15967f4addbSFrank Haverkamp #define CRC32_POLYNOMIAL 0x20044009 16067f4addbSFrank Haverkamp static u32 crc32_tab[256]; /* crc32 lookup table */ 16167f4addbSFrank Haverkamp 16267f4addbSFrank Haverkamp void genwqe_init_crc32(void) 16367f4addbSFrank Haverkamp { 16467f4addbSFrank Haverkamp int i, j; 16567f4addbSFrank Haverkamp u32 crc; 16667f4addbSFrank Haverkamp 16767f4addbSFrank Haverkamp for (i = 0; i < 256; i++) { 16867f4addbSFrank Haverkamp crc = i << 24; 16967f4addbSFrank Haverkamp for (j = 0; j < 8; j++) { 17067f4addbSFrank Haverkamp if (crc & 0x80000000) 17167f4addbSFrank Haverkamp crc = (crc << 1) ^ CRC32_POLYNOMIAL; 17267f4addbSFrank Haverkamp else 17367f4addbSFrank Haverkamp crc = (crc << 1); 17467f4addbSFrank Haverkamp } 17567f4addbSFrank Haverkamp crc32_tab[i] = crc; 17667f4addbSFrank Haverkamp } 17767f4addbSFrank Haverkamp } 17867f4addbSFrank Haverkamp 17967f4addbSFrank Haverkamp /** 18067f4addbSFrank Haverkamp * genwqe_crc32() - Generate 32-bit crc as required for DDCBs 18167f4addbSFrank Haverkamp * @buff: pointer to data buffer 18267f4addbSFrank Haverkamp * @len: length of data for calculation 18367f4addbSFrank Haverkamp * @init: initial crc (0xffffffff at start) 18467f4addbSFrank Haverkamp * 18567f4addbSFrank Haverkamp * polynomial = x^32 * + x^29 + x^18 + x^14 + x^3 + 1 (0x20044009) 18667f4addbSFrank Haverkamp 18767f4addbSFrank Haverkamp * Example: 4 bytes 0x01 0x02 0x03 0x04 with init=0xffffffff should 18867f4addbSFrank Haverkamp * result in a crc32 of 0xf33cb7d3. 18967f4addbSFrank Haverkamp * 19067f4addbSFrank Haverkamp * The existing kernel crc functions did not cover this polynom yet. 19167f4addbSFrank Haverkamp * 19267f4addbSFrank Haverkamp * Return: crc32 checksum. 19367f4addbSFrank Haverkamp */ 19467f4addbSFrank Haverkamp u32 genwqe_crc32(u8 *buff, size_t len, u32 init) 19567f4addbSFrank Haverkamp { 19667f4addbSFrank Haverkamp int i; 19767f4addbSFrank Haverkamp u32 crc; 19867f4addbSFrank Haverkamp 19967f4addbSFrank Haverkamp crc = init; 20067f4addbSFrank Haverkamp while (len--) { 20167f4addbSFrank Haverkamp i = ((crc >> 24) ^ *buff++) & 0xFF; 20267f4addbSFrank Haverkamp crc = (crc << 8) ^ crc32_tab[i]; 20367f4addbSFrank Haverkamp } 20467f4addbSFrank Haverkamp return crc; 20567f4addbSFrank Haverkamp } 20667f4addbSFrank Haverkamp 20767f4addbSFrank Haverkamp void *__genwqe_alloc_consistent(struct genwqe_dev *cd, size_t size, 20867f4addbSFrank Haverkamp dma_addr_t *dma_handle) 20967f4addbSFrank Haverkamp { 210fdd66968SChristian Borntraeger if (get_order(size) >= MAX_ORDER) 21167f4addbSFrank Haverkamp return NULL; 21267f4addbSFrank Haverkamp 213750afb08SLuis Chamberlain return dma_alloc_coherent(&cd->pci_dev->dev, size, dma_handle, 21419f7767eSSebastian Ott GFP_KERNEL); 21567f4addbSFrank Haverkamp } 21667f4addbSFrank Haverkamp 21767f4addbSFrank Haverkamp void __genwqe_free_consistent(struct genwqe_dev *cd, size_t size, 21867f4addbSFrank Haverkamp void *vaddr, dma_addr_t dma_handle) 21967f4addbSFrank Haverkamp { 22067f4addbSFrank Haverkamp if (vaddr == NULL) 22167f4addbSFrank Haverkamp return; 22267f4addbSFrank Haverkamp 22319f7767eSSebastian Ott dma_free_coherent(&cd->pci_dev->dev, size, vaddr, dma_handle); 22467f4addbSFrank Haverkamp } 22567f4addbSFrank Haverkamp 22667f4addbSFrank Haverkamp static void genwqe_unmap_pages(struct genwqe_dev *cd, dma_addr_t *dma_list, 22767f4addbSFrank Haverkamp int num_pages) 22867f4addbSFrank Haverkamp { 22967f4addbSFrank Haverkamp int i; 23067f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 23167f4addbSFrank Haverkamp 23267f4addbSFrank Haverkamp for (i = 0; (i < num_pages) && (dma_list[i] != 0x0); i++) { 23367f4addbSFrank Haverkamp pci_unmap_page(pci_dev, dma_list[i], 23467f4addbSFrank Haverkamp PAGE_SIZE, PCI_DMA_BIDIRECTIONAL); 23567f4addbSFrank Haverkamp dma_list[i] = 0x0; 23667f4addbSFrank Haverkamp } 23767f4addbSFrank Haverkamp } 23867f4addbSFrank Haverkamp 23967f4addbSFrank Haverkamp static int genwqe_map_pages(struct genwqe_dev *cd, 24067f4addbSFrank Haverkamp struct page **page_list, int num_pages, 24167f4addbSFrank Haverkamp dma_addr_t *dma_list) 24267f4addbSFrank Haverkamp { 24367f4addbSFrank Haverkamp int i; 24467f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 24567f4addbSFrank Haverkamp 24667f4addbSFrank Haverkamp /* establish DMA mapping for requested pages */ 24767f4addbSFrank Haverkamp for (i = 0; i < num_pages; i++) { 24867f4addbSFrank Haverkamp dma_addr_t daddr; 24967f4addbSFrank Haverkamp 25067f4addbSFrank Haverkamp dma_list[i] = 0x0; 25167f4addbSFrank Haverkamp daddr = pci_map_page(pci_dev, page_list[i], 25267f4addbSFrank Haverkamp 0, /* map_offs */ 25367f4addbSFrank Haverkamp PAGE_SIZE, 25467f4addbSFrank Haverkamp PCI_DMA_BIDIRECTIONAL); /* FIXME rd/rw */ 25567f4addbSFrank Haverkamp 25667f4addbSFrank Haverkamp if (pci_dma_mapping_error(pci_dev, daddr)) { 25767f4addbSFrank Haverkamp dev_err(&pci_dev->dev, 25867f4addbSFrank Haverkamp "[%s] err: no dma addr daddr=%016llx!\n", 25967f4addbSFrank Haverkamp __func__, (long long)daddr); 26067f4addbSFrank Haverkamp goto err; 26167f4addbSFrank Haverkamp } 26267f4addbSFrank Haverkamp 26367f4addbSFrank Haverkamp dma_list[i] = daddr; 26467f4addbSFrank Haverkamp } 26567f4addbSFrank Haverkamp return 0; 26667f4addbSFrank Haverkamp 26767f4addbSFrank Haverkamp err: 26867f4addbSFrank Haverkamp genwqe_unmap_pages(cd, dma_list, num_pages); 26967f4addbSFrank Haverkamp return -EIO; 27067f4addbSFrank Haverkamp } 27167f4addbSFrank Haverkamp 27267f4addbSFrank Haverkamp static int genwqe_sgl_size(int num_pages) 27367f4addbSFrank Haverkamp { 27467f4addbSFrank Haverkamp int len, num_tlb = num_pages / 7; 27567f4addbSFrank Haverkamp 27667f4addbSFrank Haverkamp len = sizeof(struct sg_entry) * (num_pages+num_tlb + 1); 27767f4addbSFrank Haverkamp return roundup(len, PAGE_SIZE); 27867f4addbSFrank Haverkamp } 27967f4addbSFrank Haverkamp 280718f762eSFrank Haverkamp /** 281718f762eSFrank Haverkamp * genwqe_alloc_sync_sgl() - Allocate memory for sgl and overlapping pages 282718f762eSFrank Haverkamp * 283718f762eSFrank Haverkamp * Allocates memory for sgl and overlapping pages. Pages which might 284718f762eSFrank Haverkamp * overlap other user-space memory blocks are being cached for DMAs, 285718f762eSFrank Haverkamp * such that we do not run into syncronization issues. Data is copied 286718f762eSFrank Haverkamp * from user-space into the cached pages. 287718f762eSFrank Haverkamp */ 288718f762eSFrank Haverkamp int genwqe_alloc_sync_sgl(struct genwqe_dev *cd, struct genwqe_sgl *sgl, 289de4ce2d1SGuilherme G. Piccoli void __user *user_addr, size_t user_size, int write) 29067f4addbSFrank Haverkamp { 29102241995Szhong jiang int ret = -ENOMEM; 29267f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 29367f4addbSFrank Haverkamp 294718f762eSFrank Haverkamp sgl->fpage_offs = offset_in_page((unsigned long)user_addr); 295718f762eSFrank Haverkamp sgl->fpage_size = min_t(size_t, PAGE_SIZE-sgl->fpage_offs, user_size); 296718f762eSFrank Haverkamp sgl->nr_pages = DIV_ROUND_UP(sgl->fpage_offs + user_size, PAGE_SIZE); 297718f762eSFrank Haverkamp sgl->lpage_size = (user_size - sgl->fpage_size) % PAGE_SIZE; 298718f762eSFrank Haverkamp 299d9c11d45SFrank Haverkamp dev_dbg(&pci_dev->dev, "[%s] uaddr=%p usize=%8ld nr_pages=%ld fpage_offs=%lx fpage_size=%ld lpage_size=%ld\n", 300718f762eSFrank Haverkamp __func__, user_addr, user_size, sgl->nr_pages, 301718f762eSFrank Haverkamp sgl->fpage_offs, sgl->fpage_size, sgl->lpage_size); 302718f762eSFrank Haverkamp 303718f762eSFrank Haverkamp sgl->user_addr = user_addr; 304718f762eSFrank Haverkamp sgl->user_size = user_size; 305de4ce2d1SGuilherme G. Piccoli sgl->write = write; 306718f762eSFrank Haverkamp sgl->sgl_size = genwqe_sgl_size(sgl->nr_pages); 307718f762eSFrank Haverkamp 308718f762eSFrank Haverkamp if (get_order(sgl->sgl_size) > MAX_ORDER) { 30967f4addbSFrank Haverkamp dev_err(&pci_dev->dev, 31067f4addbSFrank Haverkamp "[%s] err: too much memory requested!\n", __func__); 31102241995Szhong jiang return ret; 31267f4addbSFrank Haverkamp } 31367f4addbSFrank Haverkamp 314718f762eSFrank Haverkamp sgl->sgl = __genwqe_alloc_consistent(cd, sgl->sgl_size, 315718f762eSFrank Haverkamp &sgl->sgl_dma_addr); 316718f762eSFrank Haverkamp if (sgl->sgl == NULL) { 31767f4addbSFrank Haverkamp dev_err(&pci_dev->dev, 31867f4addbSFrank Haverkamp "[%s] err: no memory available!\n", __func__); 31902241995Szhong jiang return ret; 32067f4addbSFrank Haverkamp } 32167f4addbSFrank Haverkamp 322718f762eSFrank Haverkamp /* Only use buffering on incomplete pages */ 323718f762eSFrank Haverkamp if ((sgl->fpage_size != 0) && (sgl->fpage_size != PAGE_SIZE)) { 324718f762eSFrank Haverkamp sgl->fpage = __genwqe_alloc_consistent(cd, PAGE_SIZE, 325718f762eSFrank Haverkamp &sgl->fpage_dma_addr); 326718f762eSFrank Haverkamp if (sgl->fpage == NULL) 327718f762eSFrank Haverkamp goto err_out; 328718f762eSFrank Haverkamp 329718f762eSFrank Haverkamp /* Sync with user memory */ 330718f762eSFrank Haverkamp if (copy_from_user(sgl->fpage + sgl->fpage_offs, 331718f762eSFrank Haverkamp user_addr, sgl->fpage_size)) { 33202241995Szhong jiang ret = -EFAULT; 333718f762eSFrank Haverkamp goto err_out; 334718f762eSFrank Haverkamp } 335718f762eSFrank Haverkamp } 336718f762eSFrank Haverkamp if (sgl->lpage_size != 0) { 337718f762eSFrank Haverkamp sgl->lpage = __genwqe_alloc_consistent(cd, PAGE_SIZE, 338718f762eSFrank Haverkamp &sgl->lpage_dma_addr); 339718f762eSFrank Haverkamp if (sgl->lpage == NULL) 340718f762eSFrank Haverkamp goto err_out1; 341718f762eSFrank Haverkamp 342718f762eSFrank Haverkamp /* Sync with user memory */ 343718f762eSFrank Haverkamp if (copy_from_user(sgl->lpage, user_addr + user_size - 344718f762eSFrank Haverkamp sgl->lpage_size, sgl->lpage_size)) { 34502241995Szhong jiang ret = -EFAULT; 346a7a7aeefSGerald Schaefer goto err_out2; 347718f762eSFrank Haverkamp } 348718f762eSFrank Haverkamp } 349718f762eSFrank Haverkamp return 0; 350718f762eSFrank Haverkamp 351a7a7aeefSGerald Schaefer err_out2: 352a7a7aeefSGerald Schaefer __genwqe_free_consistent(cd, PAGE_SIZE, sgl->lpage, 353a7a7aeefSGerald Schaefer sgl->lpage_dma_addr); 354a7a7aeefSGerald Schaefer sgl->lpage = NULL; 355a7a7aeefSGerald Schaefer sgl->lpage_dma_addr = 0; 356718f762eSFrank Haverkamp err_out1: 357718f762eSFrank Haverkamp __genwqe_free_consistent(cd, PAGE_SIZE, sgl->fpage, 358718f762eSFrank Haverkamp sgl->fpage_dma_addr); 359a7a7aeefSGerald Schaefer sgl->fpage = NULL; 360a7a7aeefSGerald Schaefer sgl->fpage_dma_addr = 0; 361718f762eSFrank Haverkamp err_out: 362718f762eSFrank Haverkamp __genwqe_free_consistent(cd, sgl->sgl_size, sgl->sgl, 363718f762eSFrank Haverkamp sgl->sgl_dma_addr); 364a7a7aeefSGerald Schaefer sgl->sgl = NULL; 365a7a7aeefSGerald Schaefer sgl->sgl_dma_addr = 0; 366a7a7aeefSGerald Schaefer sgl->sgl_size = 0; 36702241995Szhong jiang 36802241995Szhong jiang return ret; 36967f4addbSFrank Haverkamp } 37067f4addbSFrank Haverkamp 371718f762eSFrank Haverkamp int genwqe_setup_sgl(struct genwqe_dev *cd, struct genwqe_sgl *sgl, 372718f762eSFrank Haverkamp dma_addr_t *dma_list) 37367f4addbSFrank Haverkamp { 37467f4addbSFrank Haverkamp int i = 0, j = 0, p; 37567f4addbSFrank Haverkamp unsigned long dma_offs, map_offs; 37667f4addbSFrank Haverkamp dma_addr_t prev_daddr = 0; 37767f4addbSFrank Haverkamp struct sg_entry *s, *last_s = NULL; 378718f762eSFrank Haverkamp size_t size = sgl->user_size; 37967f4addbSFrank Haverkamp 38067f4addbSFrank Haverkamp dma_offs = 128; /* next block if needed/dma_offset */ 381718f762eSFrank Haverkamp map_offs = sgl->fpage_offs; /* offset in first page */ 38267f4addbSFrank Haverkamp 383718f762eSFrank Haverkamp s = &sgl->sgl[0]; /* first set of 8 entries */ 38467f4addbSFrank Haverkamp p = 0; /* page */ 385718f762eSFrank Haverkamp while (p < sgl->nr_pages) { 38667f4addbSFrank Haverkamp dma_addr_t daddr; 38767f4addbSFrank Haverkamp unsigned int size_to_map; 38867f4addbSFrank Haverkamp 38967f4addbSFrank Haverkamp /* always write the chaining entry, cleanup is done later */ 39067f4addbSFrank Haverkamp j = 0; 391718f762eSFrank Haverkamp s[j].target_addr = cpu_to_be64(sgl->sgl_dma_addr + dma_offs); 39267f4addbSFrank Haverkamp s[j].len = cpu_to_be32(128); 39367f4addbSFrank Haverkamp s[j].flags = cpu_to_be32(SG_CHAINED); 39467f4addbSFrank Haverkamp j++; 39567f4addbSFrank Haverkamp 39667f4addbSFrank Haverkamp while (j < 8) { 39767f4addbSFrank Haverkamp /* DMA mapping for requested page, offs, size */ 39867f4addbSFrank Haverkamp size_to_map = min(size, PAGE_SIZE - map_offs); 399718f762eSFrank Haverkamp 400718f762eSFrank Haverkamp if ((p == 0) && (sgl->fpage != NULL)) { 401718f762eSFrank Haverkamp daddr = sgl->fpage_dma_addr + map_offs; 402718f762eSFrank Haverkamp 403718f762eSFrank Haverkamp } else if ((p == sgl->nr_pages - 1) && 404718f762eSFrank Haverkamp (sgl->lpage != NULL)) { 405718f762eSFrank Haverkamp daddr = sgl->lpage_dma_addr; 406718f762eSFrank Haverkamp } else { 407718f762eSFrank Haverkamp daddr = dma_list[p] + map_offs; 408718f762eSFrank Haverkamp } 409718f762eSFrank Haverkamp 41067f4addbSFrank Haverkamp size -= size_to_map; 41167f4addbSFrank Haverkamp map_offs = 0; 41267f4addbSFrank Haverkamp 41367f4addbSFrank Haverkamp if (prev_daddr == daddr) { 41467f4addbSFrank Haverkamp u32 prev_len = be32_to_cpu(last_s->len); 41567f4addbSFrank Haverkamp 41667f4addbSFrank Haverkamp /* pr_info("daddr combining: " 41767f4addbSFrank Haverkamp "%016llx/%08x -> %016llx\n", 41867f4addbSFrank Haverkamp prev_daddr, prev_len, daddr); */ 41967f4addbSFrank Haverkamp 42067f4addbSFrank Haverkamp last_s->len = cpu_to_be32(prev_len + 42167f4addbSFrank Haverkamp size_to_map); 42267f4addbSFrank Haverkamp 42367f4addbSFrank Haverkamp p++; /* process next page */ 424718f762eSFrank Haverkamp if (p == sgl->nr_pages) 42567f4addbSFrank Haverkamp goto fixup; /* nothing to do */ 42667f4addbSFrank Haverkamp 42767f4addbSFrank Haverkamp prev_daddr = daddr + size_to_map; 42867f4addbSFrank Haverkamp continue; 42967f4addbSFrank Haverkamp } 43067f4addbSFrank Haverkamp 43167f4addbSFrank Haverkamp /* start new entry */ 43267f4addbSFrank Haverkamp s[j].target_addr = cpu_to_be64(daddr); 43367f4addbSFrank Haverkamp s[j].len = cpu_to_be32(size_to_map); 43467f4addbSFrank Haverkamp s[j].flags = cpu_to_be32(SG_DATA); 43567f4addbSFrank Haverkamp prev_daddr = daddr + size_to_map; 43667f4addbSFrank Haverkamp last_s = &s[j]; 43767f4addbSFrank Haverkamp j++; 43867f4addbSFrank Haverkamp 43967f4addbSFrank Haverkamp p++; /* process next page */ 440718f762eSFrank Haverkamp if (p == sgl->nr_pages) 44167f4addbSFrank Haverkamp goto fixup; /* nothing to do */ 44267f4addbSFrank Haverkamp } 44367f4addbSFrank Haverkamp dma_offs += 128; 44467f4addbSFrank Haverkamp s += 8; /* continue 8 elements further */ 44567f4addbSFrank Haverkamp } 44667f4addbSFrank Haverkamp fixup: 4472f097267SMarkus Elfring if (j == 1) { /* combining happened on last entry! */ 44867f4addbSFrank Haverkamp s -= 8; /* full shift needed on previous sgl block */ 44967f4addbSFrank Haverkamp j = 7; /* shift all elements */ 45067f4addbSFrank Haverkamp } 45167f4addbSFrank Haverkamp 45267f4addbSFrank Haverkamp for (i = 0; i < j; i++) /* move elements 1 up */ 45367f4addbSFrank Haverkamp s[i] = s[i + 1]; 45467f4addbSFrank Haverkamp 45567f4addbSFrank Haverkamp s[i].target_addr = cpu_to_be64(0); 45667f4addbSFrank Haverkamp s[i].len = cpu_to_be32(0); 45767f4addbSFrank Haverkamp s[i].flags = cpu_to_be32(SG_END_LIST); 45867f4addbSFrank Haverkamp return 0; 45967f4addbSFrank Haverkamp } 46067f4addbSFrank Haverkamp 461718f762eSFrank Haverkamp /** 462718f762eSFrank Haverkamp * genwqe_free_sync_sgl() - Free memory for sgl and overlapping pages 463718f762eSFrank Haverkamp * 464718f762eSFrank Haverkamp * After the DMA transfer has been completed we free the memory for 4652f097267SMarkus Elfring * the sgl and the cached pages. Data is being transferred from cached 466718f762eSFrank Haverkamp * pages into user-space buffers. 467718f762eSFrank Haverkamp */ 468718f762eSFrank Haverkamp int genwqe_free_sync_sgl(struct genwqe_dev *cd, struct genwqe_sgl *sgl) 46967f4addbSFrank Haverkamp { 47063fa80cdSChristian Engelmayer int rc = 0; 471de4ce2d1SGuilherme G. Piccoli size_t offset; 472de4ce2d1SGuilherme G. Piccoli unsigned long res; 473718f762eSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 474718f762eSFrank Haverkamp 475718f762eSFrank Haverkamp if (sgl->fpage) { 476de4ce2d1SGuilherme G. Piccoli if (sgl->write) { 477de4ce2d1SGuilherme G. Piccoli res = copy_to_user(sgl->user_addr, 478de4ce2d1SGuilherme G. Piccoli sgl->fpage + sgl->fpage_offs, sgl->fpage_size); 479de4ce2d1SGuilherme G. Piccoli if (res) { 480de4ce2d1SGuilherme G. Piccoli dev_err(&pci_dev->dev, 481de4ce2d1SGuilherme G. Piccoli "[%s] err: copying fpage! (res=%lu)\n", 482de4ce2d1SGuilherme G. Piccoli __func__, res); 483718f762eSFrank Haverkamp rc = -EFAULT; 484718f762eSFrank Haverkamp } 485de4ce2d1SGuilherme G. Piccoli } 486718f762eSFrank Haverkamp __genwqe_free_consistent(cd, PAGE_SIZE, sgl->fpage, 487718f762eSFrank Haverkamp sgl->fpage_dma_addr); 488718f762eSFrank Haverkamp sgl->fpage = NULL; 489718f762eSFrank Haverkamp sgl->fpage_dma_addr = 0; 490718f762eSFrank Haverkamp } 491718f762eSFrank Haverkamp if (sgl->lpage) { 492de4ce2d1SGuilherme G. Piccoli if (sgl->write) { 493de4ce2d1SGuilherme G. Piccoli offset = sgl->user_size - sgl->lpage_size; 494de4ce2d1SGuilherme G. Piccoli res = copy_to_user(sgl->user_addr + offset, sgl->lpage, 495de4ce2d1SGuilherme G. Piccoli sgl->lpage_size); 496de4ce2d1SGuilherme G. Piccoli if (res) { 497de4ce2d1SGuilherme G. Piccoli dev_err(&pci_dev->dev, 498de4ce2d1SGuilherme G. Piccoli "[%s] err: copying lpage! (res=%lu)\n", 499de4ce2d1SGuilherme G. Piccoli __func__, res); 500718f762eSFrank Haverkamp rc = -EFAULT; 501718f762eSFrank Haverkamp } 502de4ce2d1SGuilherme G. Piccoli } 503718f762eSFrank Haverkamp __genwqe_free_consistent(cd, PAGE_SIZE, sgl->lpage, 504718f762eSFrank Haverkamp sgl->lpage_dma_addr); 505718f762eSFrank Haverkamp sgl->lpage = NULL; 506718f762eSFrank Haverkamp sgl->lpage_dma_addr = 0; 507718f762eSFrank Haverkamp } 508718f762eSFrank Haverkamp __genwqe_free_consistent(cd, sgl->sgl_size, sgl->sgl, 509718f762eSFrank Haverkamp sgl->sgl_dma_addr); 510718f762eSFrank Haverkamp 511718f762eSFrank Haverkamp sgl->sgl = NULL; 512718f762eSFrank Haverkamp sgl->sgl_dma_addr = 0x0; 513718f762eSFrank Haverkamp sgl->sgl_size = 0; 514718f762eSFrank Haverkamp return rc; 51567f4addbSFrank Haverkamp } 51667f4addbSFrank Haverkamp 51767f4addbSFrank Haverkamp /** 51867f4addbSFrank Haverkamp * genwqe_user_vmap() - Map user-space memory to virtual kernel memory 51967f4addbSFrank Haverkamp * @cd: pointer to genwqe device 52067f4addbSFrank Haverkamp * @m: mapping params 52167f4addbSFrank Haverkamp * @uaddr: user virtual address 52267f4addbSFrank Haverkamp * @size: size of memory to be mapped 52367f4addbSFrank Haverkamp * 52467f4addbSFrank Haverkamp * We need to think about how we could speed this up. Of course it is 52567f4addbSFrank Haverkamp * not a good idea to do this over and over again, like we are 52667f4addbSFrank Haverkamp * currently doing it. Nevertheless, I am curious where on the path 52767f4addbSFrank Haverkamp * the performance is spend. Most probably within the memory 52867f4addbSFrank Haverkamp * allocation functions, but maybe also in the DMA mapping code. 52967f4addbSFrank Haverkamp * 53067f4addbSFrank Haverkamp * Restrictions: The maximum size of the possible mapping currently depends 53167f4addbSFrank Haverkamp * on the amount of memory we can get using kzalloc() for the 53267f4addbSFrank Haverkamp * page_list and pci_alloc_consistent for the sg_list. 53367f4addbSFrank Haverkamp * The sg_list is currently itself not scattered, which could 53467f4addbSFrank Haverkamp * be fixed with some effort. The page_list must be split into 53567f4addbSFrank Haverkamp * PAGE_SIZE chunks too. All that will make the complicated 53667f4addbSFrank Haverkamp * code more complicated. 53767f4addbSFrank Haverkamp * 53867f4addbSFrank Haverkamp * Return: 0 if success 53967f4addbSFrank Haverkamp */ 54067f4addbSFrank Haverkamp int genwqe_user_vmap(struct genwqe_dev *cd, struct dma_mapping *m, void *uaddr, 541658a494aSGuilherme G. Piccoli unsigned long size) 54267f4addbSFrank Haverkamp { 54367f4addbSFrank Haverkamp int rc = -EINVAL; 54467f4addbSFrank Haverkamp unsigned long data, offs; 54567f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 54667f4addbSFrank Haverkamp 54767f4addbSFrank Haverkamp if ((uaddr == NULL) || (size == 0)) { 54867f4addbSFrank Haverkamp m->size = 0; /* mark unused and not added */ 54967f4addbSFrank Haverkamp return -EINVAL; 55067f4addbSFrank Haverkamp } 55167f4addbSFrank Haverkamp m->u_vaddr = uaddr; 55267f4addbSFrank Haverkamp m->size = size; 55367f4addbSFrank Haverkamp 55467f4addbSFrank Haverkamp /* determine space needed for page_list. */ 55567f4addbSFrank Haverkamp data = (unsigned long)uaddr; 55667f4addbSFrank Haverkamp offs = offset_in_page(data); 557110080ceSDan Carpenter if (size > ULONG_MAX - PAGE_SIZE - offs) { 558110080ceSDan Carpenter m->size = 0; /* mark unused and not added */ 559110080ceSDan Carpenter return -EINVAL; 560110080ceSDan Carpenter } 56167f4addbSFrank Haverkamp m->nr_pages = DIV_ROUND_UP(offs + size, PAGE_SIZE); 56267f4addbSFrank Haverkamp 56367f4addbSFrank Haverkamp m->page_list = kcalloc(m->nr_pages, 56467f4addbSFrank Haverkamp sizeof(struct page *) + sizeof(dma_addr_t), 56567f4addbSFrank Haverkamp GFP_KERNEL); 56667f4addbSFrank Haverkamp if (!m->page_list) { 56767f4addbSFrank Haverkamp dev_err(&pci_dev->dev, "err: alloc page_list failed\n"); 56867f4addbSFrank Haverkamp m->nr_pages = 0; 56967f4addbSFrank Haverkamp m->u_vaddr = NULL; 57067f4addbSFrank Haverkamp m->size = 0; /* mark unused and not added */ 57167f4addbSFrank Haverkamp return -ENOMEM; 57267f4addbSFrank Haverkamp } 57367f4addbSFrank Haverkamp m->dma_list = (dma_addr_t *)(m->page_list + m->nr_pages); 57467f4addbSFrank Haverkamp 57567f4addbSFrank Haverkamp /* pin user pages in memory */ 576*ddae1423SJohn Hubbard rc = pin_user_pages_fast(data & PAGE_MASK, /* page aligned addr */ 57767f4addbSFrank Haverkamp m->nr_pages, 57873b0140bSIra Weiny m->write ? FOLL_WRITE : 0, /* readable/writable */ 57967f4addbSFrank Haverkamp m->page_list); /* ptrs to pages */ 580cf35d6e0SIan Abbott if (rc < 0) 581*ddae1423SJohn Hubbard goto fail_pin_user_pages; 58267f4addbSFrank Haverkamp 583*ddae1423SJohn Hubbard /* assumption: pin_user_pages can be killed by signals. */ 58467f4addbSFrank Haverkamp if (rc < m->nr_pages) { 585*ddae1423SJohn Hubbard unpin_user_pages_dirty_lock(m->page_list, rc, m->write); 58667f4addbSFrank Haverkamp rc = -EFAULT; 587*ddae1423SJohn Hubbard goto fail_pin_user_pages; 58867f4addbSFrank Haverkamp } 58967f4addbSFrank Haverkamp 59067f4addbSFrank Haverkamp rc = genwqe_map_pages(cd, m->page_list, m->nr_pages, m->dma_list); 59167f4addbSFrank Haverkamp if (rc != 0) 59267f4addbSFrank Haverkamp goto fail_free_user_pages; 59367f4addbSFrank Haverkamp 59467f4addbSFrank Haverkamp return 0; 59567f4addbSFrank Haverkamp 59667f4addbSFrank Haverkamp fail_free_user_pages: 597*ddae1423SJohn Hubbard unpin_user_pages_dirty_lock(m->page_list, m->nr_pages, m->write); 59867f4addbSFrank Haverkamp 599*ddae1423SJohn Hubbard fail_pin_user_pages: 60067f4addbSFrank Haverkamp kfree(m->page_list); 60167f4addbSFrank Haverkamp m->page_list = NULL; 60267f4addbSFrank Haverkamp m->dma_list = NULL; 60367f4addbSFrank Haverkamp m->nr_pages = 0; 60467f4addbSFrank Haverkamp m->u_vaddr = NULL; 60567f4addbSFrank Haverkamp m->size = 0; /* mark unused and not added */ 60667f4addbSFrank Haverkamp return rc; 60767f4addbSFrank Haverkamp } 60867f4addbSFrank Haverkamp 60967f4addbSFrank Haverkamp /** 61067f4addbSFrank Haverkamp * genwqe_user_vunmap() - Undo mapping of user-space mem to virtual kernel 61167f4addbSFrank Haverkamp * memory 61267f4addbSFrank Haverkamp * @cd: pointer to genwqe device 61367f4addbSFrank Haverkamp * @m: mapping params 61467f4addbSFrank Haverkamp */ 615658a494aSGuilherme G. Piccoli int genwqe_user_vunmap(struct genwqe_dev *cd, struct dma_mapping *m) 61667f4addbSFrank Haverkamp { 61767f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 61867f4addbSFrank Haverkamp 61967f4addbSFrank Haverkamp if (!dma_mapping_used(m)) { 62067f4addbSFrank Haverkamp dev_err(&pci_dev->dev, "[%s] err: mapping %p not used!\n", 62167f4addbSFrank Haverkamp __func__, m); 62267f4addbSFrank Haverkamp return -EINVAL; 62367f4addbSFrank Haverkamp } 62467f4addbSFrank Haverkamp 62567f4addbSFrank Haverkamp if (m->dma_list) 62667f4addbSFrank Haverkamp genwqe_unmap_pages(cd, m->dma_list, m->nr_pages); 62767f4addbSFrank Haverkamp 62867f4addbSFrank Haverkamp if (m->page_list) { 629*ddae1423SJohn Hubbard unpin_user_pages_dirty_lock(m->page_list, m->nr_pages, 630*ddae1423SJohn Hubbard m->write); 63167f4addbSFrank Haverkamp kfree(m->page_list); 63267f4addbSFrank Haverkamp m->page_list = NULL; 63367f4addbSFrank Haverkamp m->dma_list = NULL; 63467f4addbSFrank Haverkamp m->nr_pages = 0; 63567f4addbSFrank Haverkamp } 63667f4addbSFrank Haverkamp 63767f4addbSFrank Haverkamp m->u_vaddr = NULL; 63867f4addbSFrank Haverkamp m->size = 0; /* mark as unused and not added */ 63967f4addbSFrank Haverkamp return 0; 64067f4addbSFrank Haverkamp } 64167f4addbSFrank Haverkamp 64267f4addbSFrank Haverkamp /** 64367f4addbSFrank Haverkamp * genwqe_card_type() - Get chip type SLU Configuration Register 64467f4addbSFrank Haverkamp * @cd: pointer to the genwqe device descriptor 64567f4addbSFrank Haverkamp * Return: 0: Altera Stratix-IV 230 64667f4addbSFrank Haverkamp * 1: Altera Stratix-IV 530 64767f4addbSFrank Haverkamp * 2: Altera Stratix-V A4 64867f4addbSFrank Haverkamp * 3: Altera Stratix-V A7 64967f4addbSFrank Haverkamp */ 65067f4addbSFrank Haverkamp u8 genwqe_card_type(struct genwqe_dev *cd) 65167f4addbSFrank Haverkamp { 65267f4addbSFrank Haverkamp u64 card_type = cd->slu_unitcfg; 653d9c11d45SFrank Haverkamp 65467f4addbSFrank Haverkamp return (u8)((card_type & IO_SLU_UNITCFG_TYPE_MASK) >> 20); 65567f4addbSFrank Haverkamp } 65667f4addbSFrank Haverkamp 65767f4addbSFrank Haverkamp /** 65867f4addbSFrank Haverkamp * genwqe_card_reset() - Reset the card 65967f4addbSFrank Haverkamp * @cd: pointer to the genwqe device descriptor 66067f4addbSFrank Haverkamp */ 66167f4addbSFrank Haverkamp int genwqe_card_reset(struct genwqe_dev *cd) 66267f4addbSFrank Haverkamp { 66367f4addbSFrank Haverkamp u64 softrst; 66467f4addbSFrank Haverkamp struct pci_dev *pci_dev = cd->pci_dev; 66567f4addbSFrank Haverkamp 66667f4addbSFrank Haverkamp if (!genwqe_is_privileged(cd)) 66767f4addbSFrank Haverkamp return -ENODEV; 66867f4addbSFrank Haverkamp 66967f4addbSFrank Haverkamp /* new SL */ 67067f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_CFGREG_SOFTRESET, 0x1ull); 67167f4addbSFrank Haverkamp msleep(1000); 67267f4addbSFrank Haverkamp __genwqe_readq(cd, IO_HSU_FIR_CLR); 67367f4addbSFrank Haverkamp __genwqe_readq(cd, IO_APP_FIR_CLR); 67467f4addbSFrank Haverkamp __genwqe_readq(cd, IO_SLU_FIR_CLR); 67567f4addbSFrank Haverkamp 67667f4addbSFrank Haverkamp /* 67767f4addbSFrank Haverkamp * Read-modify-write to preserve the stealth bits 67867f4addbSFrank Haverkamp * 67967f4addbSFrank Haverkamp * For SL >= 039, Stealth WE bit allows removing 68067f4addbSFrank Haverkamp * the read-modify-wrote. 68167f4addbSFrank Haverkamp * r-m-w may require a mask 0x3C to avoid hitting hard 68267f4addbSFrank Haverkamp * reset again for error reset (should be 0, chicken). 68367f4addbSFrank Haverkamp */ 68467f4addbSFrank Haverkamp softrst = __genwqe_readq(cd, IO_SLC_CFGREG_SOFTRESET) & 0x3cull; 68567f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_CFGREG_SOFTRESET, softrst | 0x2ull); 68667f4addbSFrank Haverkamp 68767f4addbSFrank Haverkamp /* give ERRORRESET some time to finish */ 68867f4addbSFrank Haverkamp msleep(50); 68967f4addbSFrank Haverkamp 69067f4addbSFrank Haverkamp if (genwqe_need_err_masking(cd)) { 69167f4addbSFrank Haverkamp dev_info(&pci_dev->dev, 69267f4addbSFrank Haverkamp "[%s] masking errors for old bitstreams\n", __func__); 69367f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_MISC_DEBUG, 0x0aull); 69467f4addbSFrank Haverkamp } 69567f4addbSFrank Haverkamp return 0; 69667f4addbSFrank Haverkamp } 69767f4addbSFrank Haverkamp 69867f4addbSFrank Haverkamp int genwqe_read_softreset(struct genwqe_dev *cd) 69967f4addbSFrank Haverkamp { 70067f4addbSFrank Haverkamp u64 bitstream; 70167f4addbSFrank Haverkamp 70267f4addbSFrank Haverkamp if (!genwqe_is_privileged(cd)) 70367f4addbSFrank Haverkamp return -ENODEV; 70467f4addbSFrank Haverkamp 70567f4addbSFrank Haverkamp bitstream = __genwqe_readq(cd, IO_SLU_BITSTREAM) & 0x1; 70667f4addbSFrank Haverkamp cd->softreset = (bitstream == 0) ? 0x8ull : 0xcull; 70767f4addbSFrank Haverkamp return 0; 70867f4addbSFrank Haverkamp } 70967f4addbSFrank Haverkamp 71067f4addbSFrank Haverkamp /** 71167f4addbSFrank Haverkamp * genwqe_set_interrupt_capability() - Configure MSI capability structure 71267f4addbSFrank Haverkamp * @cd: pointer to the device 71367f4addbSFrank Haverkamp * Return: 0 if no error 71467f4addbSFrank Haverkamp */ 71567f4addbSFrank Haverkamp int genwqe_set_interrupt_capability(struct genwqe_dev *cd, int count) 71667f4addbSFrank Haverkamp { 71767f4addbSFrank Haverkamp int rc; 71867f4addbSFrank Haverkamp 719d3f45647SChristoph Hellwig rc = pci_alloc_irq_vectors(cd->pci_dev, 1, count, PCI_IRQ_MSI); 7207276883fSSebastian Ott if (rc < 0) 72167f4addbSFrank Haverkamp return rc; 7227276883fSSebastian Ott return 0; 72367f4addbSFrank Haverkamp } 72467f4addbSFrank Haverkamp 72567f4addbSFrank Haverkamp /** 72667f4addbSFrank Haverkamp * genwqe_reset_interrupt_capability() - Undo genwqe_set_interrupt_capability() 72767f4addbSFrank Haverkamp * @cd: pointer to the device 72867f4addbSFrank Haverkamp */ 72967f4addbSFrank Haverkamp void genwqe_reset_interrupt_capability(struct genwqe_dev *cd) 73067f4addbSFrank Haverkamp { 731d3f45647SChristoph Hellwig pci_free_irq_vectors(cd->pci_dev); 73267f4addbSFrank Haverkamp } 73367f4addbSFrank Haverkamp 73467f4addbSFrank Haverkamp /** 73567f4addbSFrank Haverkamp * set_reg_idx() - Fill array with data. Ignore illegal offsets. 73667f4addbSFrank Haverkamp * @cd: card device 73767f4addbSFrank Haverkamp * @r: debug register array 73867f4addbSFrank Haverkamp * @i: index to desired entry 73967f4addbSFrank Haverkamp * @m: maximum possible entries 74067f4addbSFrank Haverkamp * @addr: addr which is read 74167f4addbSFrank Haverkamp * @index: index in debug array 74267f4addbSFrank Haverkamp * @val: read value 74367f4addbSFrank Haverkamp */ 74467f4addbSFrank Haverkamp static int set_reg_idx(struct genwqe_dev *cd, struct genwqe_reg *r, 74567f4addbSFrank Haverkamp unsigned int *i, unsigned int m, u32 addr, u32 idx, 74667f4addbSFrank Haverkamp u64 val) 74767f4addbSFrank Haverkamp { 74867f4addbSFrank Haverkamp if (WARN_ON_ONCE(*i >= m)) 74967f4addbSFrank Haverkamp return -EFAULT; 75067f4addbSFrank Haverkamp 75167f4addbSFrank Haverkamp r[*i].addr = addr; 75267f4addbSFrank Haverkamp r[*i].idx = idx; 75367f4addbSFrank Haverkamp r[*i].val = val; 75467f4addbSFrank Haverkamp ++*i; 75567f4addbSFrank Haverkamp return 0; 75667f4addbSFrank Haverkamp } 75767f4addbSFrank Haverkamp 75867f4addbSFrank Haverkamp static int set_reg(struct genwqe_dev *cd, struct genwqe_reg *r, 75967f4addbSFrank Haverkamp unsigned int *i, unsigned int m, u32 addr, u64 val) 76067f4addbSFrank Haverkamp { 76167f4addbSFrank Haverkamp return set_reg_idx(cd, r, i, m, addr, 0, val); 76267f4addbSFrank Haverkamp } 76367f4addbSFrank Haverkamp 76467f4addbSFrank Haverkamp int genwqe_read_ffdc_regs(struct genwqe_dev *cd, struct genwqe_reg *regs, 76567f4addbSFrank Haverkamp unsigned int max_regs, int all) 76667f4addbSFrank Haverkamp { 76767f4addbSFrank Haverkamp unsigned int i, j, idx = 0; 76867f4addbSFrank Haverkamp u32 ufir_addr, ufec_addr, sfir_addr, sfec_addr; 76967f4addbSFrank Haverkamp u64 gfir, sluid, appid, ufir, ufec, sfir, sfec; 77067f4addbSFrank Haverkamp 77167f4addbSFrank Haverkamp /* Global FIR */ 77267f4addbSFrank Haverkamp gfir = __genwqe_readq(cd, IO_SLC_CFGREG_GFIR); 77367f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, IO_SLC_CFGREG_GFIR, gfir); 77467f4addbSFrank Haverkamp 77567f4addbSFrank Haverkamp /* UnitCfg for SLU */ 77667f4addbSFrank Haverkamp sluid = __genwqe_readq(cd, IO_SLU_UNITCFG); /* 0x00000000 */ 77767f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, IO_SLU_UNITCFG, sluid); 77867f4addbSFrank Haverkamp 77967f4addbSFrank Haverkamp /* UnitCfg for APP */ 78067f4addbSFrank Haverkamp appid = __genwqe_readq(cd, IO_APP_UNITCFG); /* 0x02000000 */ 78167f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, IO_APP_UNITCFG, appid); 78267f4addbSFrank Haverkamp 78367f4addbSFrank Haverkamp /* Check all chip Units */ 78467f4addbSFrank Haverkamp for (i = 0; i < GENWQE_MAX_UNITS; i++) { 78567f4addbSFrank Haverkamp 78667f4addbSFrank Haverkamp /* Unit FIR */ 78767f4addbSFrank Haverkamp ufir_addr = (i << 24) | 0x008; 78867f4addbSFrank Haverkamp ufir = __genwqe_readq(cd, ufir_addr); 78967f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, ufir_addr, ufir); 79067f4addbSFrank Haverkamp 79167f4addbSFrank Haverkamp /* Unit FEC */ 79267f4addbSFrank Haverkamp ufec_addr = (i << 24) | 0x018; 79367f4addbSFrank Haverkamp ufec = __genwqe_readq(cd, ufec_addr); 79467f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, ufec_addr, ufec); 79567f4addbSFrank Haverkamp 79667f4addbSFrank Haverkamp for (j = 0; j < 64; j++) { 79767f4addbSFrank Haverkamp /* wherever there is a primary 1, read the 2ndary */ 79867f4addbSFrank Haverkamp if (!all && (!(ufir & (1ull << j)))) 79967f4addbSFrank Haverkamp continue; 80067f4addbSFrank Haverkamp 80167f4addbSFrank Haverkamp sfir_addr = (i << 24) | (0x100 + 8 * j); 80267f4addbSFrank Haverkamp sfir = __genwqe_readq(cd, sfir_addr); 80367f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, sfir_addr, sfir); 80467f4addbSFrank Haverkamp 80567f4addbSFrank Haverkamp sfec_addr = (i << 24) | (0x300 + 8 * j); 80667f4addbSFrank Haverkamp sfec = __genwqe_readq(cd, sfec_addr); 80767f4addbSFrank Haverkamp set_reg(cd, regs, &idx, max_regs, sfec_addr, sfec); 80867f4addbSFrank Haverkamp } 80967f4addbSFrank Haverkamp } 81067f4addbSFrank Haverkamp 81167f4addbSFrank Haverkamp /* fill with invalid data until end */ 81267f4addbSFrank Haverkamp for (i = idx; i < max_regs; i++) { 81367f4addbSFrank Haverkamp regs[i].addr = 0xffffffff; 81467f4addbSFrank Haverkamp regs[i].val = 0xffffffffffffffffull; 81567f4addbSFrank Haverkamp } 81667f4addbSFrank Haverkamp return idx; 81767f4addbSFrank Haverkamp } 81867f4addbSFrank Haverkamp 81967f4addbSFrank Haverkamp /** 82067f4addbSFrank Haverkamp * genwqe_ffdc_buff_size() - Calculates the number of dump registers 82167f4addbSFrank Haverkamp */ 82267f4addbSFrank Haverkamp int genwqe_ffdc_buff_size(struct genwqe_dev *cd, int uid) 82367f4addbSFrank Haverkamp { 82467f4addbSFrank Haverkamp int entries = 0, ring, traps, traces, trace_entries; 82567f4addbSFrank Haverkamp u32 eevptr_addr, l_addr, d_len, d_type; 82667f4addbSFrank Haverkamp u64 eevptr, val, addr; 82767f4addbSFrank Haverkamp 82867f4addbSFrank Haverkamp eevptr_addr = GENWQE_UID_OFFS(uid) | IO_EXTENDED_ERROR_POINTER; 82967f4addbSFrank Haverkamp eevptr = __genwqe_readq(cd, eevptr_addr); 83067f4addbSFrank Haverkamp 83167f4addbSFrank Haverkamp if ((eevptr != 0x0) && (eevptr != -1ull)) { 83267f4addbSFrank Haverkamp l_addr = GENWQE_UID_OFFS(uid) | eevptr; 83367f4addbSFrank Haverkamp 83467f4addbSFrank Haverkamp while (1) { 83567f4addbSFrank Haverkamp val = __genwqe_readq(cd, l_addr); 83667f4addbSFrank Haverkamp 83767f4addbSFrank Haverkamp if ((val == 0x0) || (val == -1ull)) 83867f4addbSFrank Haverkamp break; 83967f4addbSFrank Haverkamp 84067f4addbSFrank Haverkamp /* 38:24 */ 84167f4addbSFrank Haverkamp d_len = (val & 0x0000007fff000000ull) >> 24; 84267f4addbSFrank Haverkamp 84367f4addbSFrank Haverkamp /* 39 */ 84467f4addbSFrank Haverkamp d_type = (val & 0x0000008000000000ull) >> 36; 84567f4addbSFrank Haverkamp 84667f4addbSFrank Haverkamp if (d_type) { /* repeat */ 84767f4addbSFrank Haverkamp entries += d_len; 84867f4addbSFrank Haverkamp } else { /* size in bytes! */ 84967f4addbSFrank Haverkamp entries += d_len >> 3; 85067f4addbSFrank Haverkamp } 85167f4addbSFrank Haverkamp 85267f4addbSFrank Haverkamp l_addr += 8; 85367f4addbSFrank Haverkamp } 85467f4addbSFrank Haverkamp } 85567f4addbSFrank Haverkamp 85667f4addbSFrank Haverkamp for (ring = 0; ring < 8; ring++) { 85767f4addbSFrank Haverkamp addr = GENWQE_UID_OFFS(uid) | IO_EXTENDED_DIAG_MAP(ring); 85867f4addbSFrank Haverkamp val = __genwqe_readq(cd, addr); 85967f4addbSFrank Haverkamp 86067f4addbSFrank Haverkamp if ((val == 0x0ull) || (val == -1ull)) 86167f4addbSFrank Haverkamp continue; 86267f4addbSFrank Haverkamp 86367f4addbSFrank Haverkamp traps = (val >> 24) & 0xff; 86467f4addbSFrank Haverkamp traces = (val >> 16) & 0xff; 86567f4addbSFrank Haverkamp trace_entries = val & 0xffff; 86667f4addbSFrank Haverkamp 86767f4addbSFrank Haverkamp entries += traps + (traces * trace_entries); 86867f4addbSFrank Haverkamp } 86967f4addbSFrank Haverkamp return entries; 87067f4addbSFrank Haverkamp } 87167f4addbSFrank Haverkamp 87267f4addbSFrank Haverkamp /** 87367f4addbSFrank Haverkamp * genwqe_ffdc_buff_read() - Implements LogoutExtendedErrorRegisters procedure 87467f4addbSFrank Haverkamp */ 87567f4addbSFrank Haverkamp int genwqe_ffdc_buff_read(struct genwqe_dev *cd, int uid, 87667f4addbSFrank Haverkamp struct genwqe_reg *regs, unsigned int max_regs) 87767f4addbSFrank Haverkamp { 87867f4addbSFrank Haverkamp int i, traps, traces, trace, trace_entries, trace_entry, ring; 87967f4addbSFrank Haverkamp unsigned int idx = 0; 88067f4addbSFrank Haverkamp u32 eevptr_addr, l_addr, d_addr, d_len, d_type; 88167f4addbSFrank Haverkamp u64 eevptr, e, val, addr; 88267f4addbSFrank Haverkamp 88367f4addbSFrank Haverkamp eevptr_addr = GENWQE_UID_OFFS(uid) | IO_EXTENDED_ERROR_POINTER; 88467f4addbSFrank Haverkamp eevptr = __genwqe_readq(cd, eevptr_addr); 88567f4addbSFrank Haverkamp 88667f4addbSFrank Haverkamp if ((eevptr != 0x0) && (eevptr != 0xffffffffffffffffull)) { 88767f4addbSFrank Haverkamp l_addr = GENWQE_UID_OFFS(uid) | eevptr; 88867f4addbSFrank Haverkamp while (1) { 88967f4addbSFrank Haverkamp e = __genwqe_readq(cd, l_addr); 89067f4addbSFrank Haverkamp if ((e == 0x0) || (e == 0xffffffffffffffffull)) 89167f4addbSFrank Haverkamp break; 89267f4addbSFrank Haverkamp 89367f4addbSFrank Haverkamp d_addr = (e & 0x0000000000ffffffull); /* 23:0 */ 89467f4addbSFrank Haverkamp d_len = (e & 0x0000007fff000000ull) >> 24; /* 38:24 */ 89567f4addbSFrank Haverkamp d_type = (e & 0x0000008000000000ull) >> 36; /* 39 */ 89667f4addbSFrank Haverkamp d_addr |= GENWQE_UID_OFFS(uid); 89767f4addbSFrank Haverkamp 89867f4addbSFrank Haverkamp if (d_type) { 89967f4addbSFrank Haverkamp for (i = 0; i < (int)d_len; i++) { 90067f4addbSFrank Haverkamp val = __genwqe_readq(cd, d_addr); 90167f4addbSFrank Haverkamp set_reg_idx(cd, regs, &idx, max_regs, 90267f4addbSFrank Haverkamp d_addr, i, val); 90367f4addbSFrank Haverkamp } 90467f4addbSFrank Haverkamp } else { 90567f4addbSFrank Haverkamp d_len >>= 3; /* Size in bytes! */ 90667f4addbSFrank Haverkamp for (i = 0; i < (int)d_len; i++, d_addr += 8) { 90767f4addbSFrank Haverkamp val = __genwqe_readq(cd, d_addr); 90867f4addbSFrank Haverkamp set_reg_idx(cd, regs, &idx, max_regs, 90967f4addbSFrank Haverkamp d_addr, 0, val); 91067f4addbSFrank Haverkamp } 91167f4addbSFrank Haverkamp } 91267f4addbSFrank Haverkamp l_addr += 8; 91367f4addbSFrank Haverkamp } 91467f4addbSFrank Haverkamp } 91567f4addbSFrank Haverkamp 91667f4addbSFrank Haverkamp /* 91767f4addbSFrank Haverkamp * To save time, there are only 6 traces poplulated on Uid=2, 91867f4addbSFrank Haverkamp * Ring=1. each with iters=512. 91967f4addbSFrank Haverkamp */ 92067f4addbSFrank Haverkamp for (ring = 0; ring < 8; ring++) { /* 0 is fls, 1 is fds, 92167f4addbSFrank Haverkamp 2...7 are ASI rings */ 92267f4addbSFrank Haverkamp addr = GENWQE_UID_OFFS(uid) | IO_EXTENDED_DIAG_MAP(ring); 92367f4addbSFrank Haverkamp val = __genwqe_readq(cd, addr); 92467f4addbSFrank Haverkamp 92567f4addbSFrank Haverkamp if ((val == 0x0ull) || (val == -1ull)) 92667f4addbSFrank Haverkamp continue; 92767f4addbSFrank Haverkamp 92867f4addbSFrank Haverkamp traps = (val >> 24) & 0xff; /* Number of Traps */ 92967f4addbSFrank Haverkamp traces = (val >> 16) & 0xff; /* Number of Traces */ 93067f4addbSFrank Haverkamp trace_entries = val & 0xffff; /* Entries per trace */ 93167f4addbSFrank Haverkamp 93267f4addbSFrank Haverkamp /* Note: This is a combined loop that dumps both the traps */ 93367f4addbSFrank Haverkamp /* (for the trace == 0 case) as well as the traces 1 to */ 93467f4addbSFrank Haverkamp /* 'traces'. */ 93567f4addbSFrank Haverkamp for (trace = 0; trace <= traces; trace++) { 93667f4addbSFrank Haverkamp u32 diag_sel = 93767f4addbSFrank Haverkamp GENWQE_EXTENDED_DIAG_SELECTOR(ring, trace); 93867f4addbSFrank Haverkamp 93967f4addbSFrank Haverkamp addr = (GENWQE_UID_OFFS(uid) | 94067f4addbSFrank Haverkamp IO_EXTENDED_DIAG_SELECTOR); 94167f4addbSFrank Haverkamp __genwqe_writeq(cd, addr, diag_sel); 94267f4addbSFrank Haverkamp 94367f4addbSFrank Haverkamp for (trace_entry = 0; 94467f4addbSFrank Haverkamp trace_entry < (trace ? trace_entries : traps); 94567f4addbSFrank Haverkamp trace_entry++) { 94667f4addbSFrank Haverkamp addr = (GENWQE_UID_OFFS(uid) | 94767f4addbSFrank Haverkamp IO_EXTENDED_DIAG_READ_MBX); 94867f4addbSFrank Haverkamp val = __genwqe_readq(cd, addr); 94967f4addbSFrank Haverkamp set_reg_idx(cd, regs, &idx, max_regs, addr, 95067f4addbSFrank Haverkamp (diag_sel<<16) | trace_entry, val); 95167f4addbSFrank Haverkamp } 95267f4addbSFrank Haverkamp } 95367f4addbSFrank Haverkamp } 95467f4addbSFrank Haverkamp return 0; 95567f4addbSFrank Haverkamp } 95667f4addbSFrank Haverkamp 95767f4addbSFrank Haverkamp /** 95867f4addbSFrank Haverkamp * genwqe_write_vreg() - Write register in virtual window 95967f4addbSFrank Haverkamp * 96067f4addbSFrank Haverkamp * Note, these registers are only accessible to the PF through the 96167f4addbSFrank Haverkamp * VF-window. It is not intended for the VF to access. 96267f4addbSFrank Haverkamp */ 96367f4addbSFrank Haverkamp int genwqe_write_vreg(struct genwqe_dev *cd, u32 reg, u64 val, int func) 96467f4addbSFrank Haverkamp { 96567f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_PF_SLC_VIRTUAL_WINDOW, func & 0xf); 96667f4addbSFrank Haverkamp __genwqe_writeq(cd, reg, val); 96767f4addbSFrank Haverkamp return 0; 96867f4addbSFrank Haverkamp } 96967f4addbSFrank Haverkamp 97067f4addbSFrank Haverkamp /** 97167f4addbSFrank Haverkamp * genwqe_read_vreg() - Read register in virtual window 97267f4addbSFrank Haverkamp * 97367f4addbSFrank Haverkamp * Note, these registers are only accessible to the PF through the 97467f4addbSFrank Haverkamp * VF-window. It is not intended for the VF to access. 97567f4addbSFrank Haverkamp */ 97667f4addbSFrank Haverkamp u64 genwqe_read_vreg(struct genwqe_dev *cd, u32 reg, int func) 97767f4addbSFrank Haverkamp { 97867f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_PF_SLC_VIRTUAL_WINDOW, func & 0xf); 97967f4addbSFrank Haverkamp return __genwqe_readq(cd, reg); 98067f4addbSFrank Haverkamp } 98167f4addbSFrank Haverkamp 98267f4addbSFrank Haverkamp /** 98367f4addbSFrank Haverkamp * genwqe_base_clock_frequency() - Deteremine base clock frequency of the card 98467f4addbSFrank Haverkamp * 98567f4addbSFrank Haverkamp * Note: From a design perspective it turned out to be a bad idea to 98667f4addbSFrank Haverkamp * use codes here to specifiy the frequency/speed values. An old 98767f4addbSFrank Haverkamp * driver cannot understand new codes and is therefore always a 98867f4addbSFrank Haverkamp * problem. Better is to measure out the value or put the 98967f4addbSFrank Haverkamp * speed/frequency directly into a register which is always a valid 99067f4addbSFrank Haverkamp * value for old as well as for new software. 99167f4addbSFrank Haverkamp * 99267f4addbSFrank Haverkamp * Return: Card clock in MHz 99367f4addbSFrank Haverkamp */ 99467f4addbSFrank Haverkamp int genwqe_base_clock_frequency(struct genwqe_dev *cd) 99567f4addbSFrank Haverkamp { 99667f4addbSFrank Haverkamp u16 speed; /* MHz MHz MHz MHz */ 99767f4addbSFrank Haverkamp static const int speed_grade[] = { 250, 200, 166, 175 }; 99867f4addbSFrank Haverkamp 99967f4addbSFrank Haverkamp speed = (u16)((cd->slu_unitcfg >> 28) & 0x0full); 100067f4addbSFrank Haverkamp if (speed >= ARRAY_SIZE(speed_grade)) 100167f4addbSFrank Haverkamp return 0; /* illegal value */ 100267f4addbSFrank Haverkamp 100367f4addbSFrank Haverkamp return speed_grade[speed]; 100467f4addbSFrank Haverkamp } 100567f4addbSFrank Haverkamp 100667f4addbSFrank Haverkamp /** 100767f4addbSFrank Haverkamp * genwqe_stop_traps() - Stop traps 100867f4addbSFrank Haverkamp * 100967f4addbSFrank Haverkamp * Before reading out the analysis data, we need to stop the traps. 101067f4addbSFrank Haverkamp */ 101167f4addbSFrank Haverkamp void genwqe_stop_traps(struct genwqe_dev *cd) 101267f4addbSFrank Haverkamp { 101367f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_MISC_DEBUG_SET, 0xcull); 101467f4addbSFrank Haverkamp } 101567f4addbSFrank Haverkamp 101667f4addbSFrank Haverkamp /** 101767f4addbSFrank Haverkamp * genwqe_start_traps() - Start traps 101867f4addbSFrank Haverkamp * 101967f4addbSFrank Haverkamp * After having read the data, we can/must enable the traps again. 102067f4addbSFrank Haverkamp */ 102167f4addbSFrank Haverkamp void genwqe_start_traps(struct genwqe_dev *cd) 102267f4addbSFrank Haverkamp { 102367f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_MISC_DEBUG_CLR, 0xcull); 102467f4addbSFrank Haverkamp 102567f4addbSFrank Haverkamp if (genwqe_need_err_masking(cd)) 102667f4addbSFrank Haverkamp __genwqe_writeq(cd, IO_SLC_MISC_DEBUG, 0x0aull); 102767f4addbSFrank Haverkamp } 1028