#ifndef __CARD_BASE_H__ #define __CARD_BASE_H__ /** * IBM Accelerator Family 'GenWQE' * * (C) Copyright IBM Corp. 2013 * * Author: Frank Haverkamp <haver@linux.vnet.ibm.com> * Author: Joerg-Stephan Vogt <jsvogt@de.ibm.com> * Author: Michael Jung <mijung@de.ibm.com> * Author: Michael Ruettger <michael@ibmra.de> * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License (version 2 only) * as published by the Free Software Foundation. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. */ /* * Interfaces within the GenWQE module. Defines genwqe_card and * ddcb_queue as well as ddcb_requ. */ #include <linux/kernel.h> #include <linux/types.h> #include <linux/cdev.h> #include <linux/stringify.h> #include <linux/pci.h> #include <linux/semaphore.h> #include <linux/uaccess.h> #include <linux/io.h> #include <linux/version.h> #include <linux/debugfs.h> #include <linux/slab.h> #include <linux/genwqe/genwqe_card.h> #include "genwqe_driver.h" #define GENWQE_MSI_IRQS 4 /* Just one supported, no MSIx */ #define GENWQE_FLAG_MSI_ENABLED (1 << 0) #define GENWQE_MAX_VFS 15 /* maximum 15 VFs are possible */ #define GENWQE_MAX_FUNCS 16 /* 1 PF and 15 VFs */ #define GENWQE_CARD_NO_MAX (16 * GENWQE_MAX_FUNCS) /* Compile parameters, some of them appear in debugfs for later adjustment */ #define genwqe_ddcb_max 32 /* DDCBs on the work-queue */ #define genwqe_polling_enabled 0 /* in case of irqs not working */ #define genwqe_ddcb_software_timeout 10 /* timeout per DDCB in seconds */ #define genwqe_kill_timeout 8 /* time until process gets killed */ #define genwqe_vf_jobtimeout_msec 250 /* 250 msec */ #define genwqe_pf_jobtimeout_msec 8000 /* 8 sec should be ok */ #define genwqe_health_check_interval 4 /* <= 0: disabled */ /* Sysfs attribute groups used when we create the genwqe device */ extern const struct attribute_group *genwqe_attribute_groups[]; /* * Config space for Genwqe5 A7: * 00:[14 10 4b 04]40 00 10 00[00 00 00 12]00 00 00 00 * 10: 0c 00 00 f0 07 3c 00 00 00 00 00 00 00 00 00 00 * 20: 00 00 00 00 00 00 00 00 00 00 00 00[14 10 4b 04] * 30: 00 00 00 00 50 00 00 00 00 00 00 00 00 00 00 00 */ #define PCI_DEVICE_GENWQE 0x044b /* Genwqe DeviceID */ #define PCI_SUBSYSTEM_ID_GENWQE5 0x035f /* Genwqe A5 Subsystem-ID */ #define PCI_SUBSYSTEM_ID_GENWQE5_NEW 0x044b /* Genwqe A5 Subsystem-ID */ #define PCI_CLASSCODE_GENWQE5 0x1200 /* UNKNOWN */ #define PCI_SUBVENDOR_ID_IBM_SRIOV 0x0000 #define PCI_SUBSYSTEM_ID_GENWQE5_SRIOV 0x0000 /* Genwqe A5 Subsystem-ID */ #define PCI_CLASSCODE_GENWQE5_SRIOV 0x1200 /* UNKNOWN */ #define GENWQE_SLU_ARCH_REQ 2 /* Required SLU architecture level */ /** * struct genwqe_reg - Genwqe data dump functionality */ struct genwqe_reg { u32 addr; u32 idx; u64 val; }; /* * enum genwqe_dbg_type - Specify chip unit to dump/debug */ enum genwqe_dbg_type { GENWQE_DBG_UNIT0 = 0, /* captured before prev errs cleared */ GENWQE_DBG_UNIT1 = 1, GENWQE_DBG_UNIT2 = 2, GENWQE_DBG_UNIT3 = 3, GENWQE_DBG_UNIT4 = 4, GENWQE_DBG_UNIT5 = 5, GENWQE_DBG_UNIT6 = 6, GENWQE_DBG_UNIT7 = 7, GENWQE_DBG_REGS = 8, GENWQE_DBG_DMA = 9, GENWQE_DBG_UNITS = 10, /* max number of possible debug units */ }; /* Software error injection to simulate card failures */ #define GENWQE_INJECT_HARDWARE_FAILURE 0x00000001 /* injects -1 reg reads */ #define GENWQE_INJECT_BUS_RESET_FAILURE 0x00000002 /* pci_bus_reset fail */ #define GENWQE_INJECT_GFIR_FATAL 0x00000004 /* GFIR = 0x0000ffff */ #define GENWQE_INJECT_GFIR_INFO 0x00000008 /* GFIR = 0xffff0000 */ /* * Genwqe card description and management data. * * Error-handling in case of card malfunction * ------------------------------------------ * * If the card is detected to be defective the outside environment * will cause the PCI layer to call deinit (the cleanup function for * probe). This is the same effect like doing a unbind/bind operation * on the card. * * The genwqe card driver implements a health checking thread which * verifies the card function. If this detects a problem the cards * device is being shutdown and restarted again, along with a reset of * the card and queue. * * All functions accessing the card device return either -EIO or -ENODEV * code to indicate the malfunction to the user. The user has to close * the file descriptor and open a new one, once the card becomes * available again. * * If the open file descriptor is setup to receive SIGIO, the signal is * genereated for the application which has to provide a handler to * react on it. If the application does not close the open * file descriptor a SIGKILL is send to enforce freeing the cards * resources. * * I did not find a different way to prevent kernel problems due to * reference counters for the cards character devices getting out of * sync. The character device deallocation does not block, even if * there is still an open file descriptor pending. If this pending * descriptor is closed, the data structures used by the character * device is reinstantiated, which will lead to the reference counter * dropping below the allowed values. * * Card recovery * ------------- * * To test the internal driver recovery the following command can be used: * sudo sh -c 'echo 0xfffff > /sys/class/genwqe/genwqe0_card/err_inject' */ /** * struct dma_mapping_type - Mapping type definition * * To avoid memcpying data arround we use user memory directly. To do * this we need to pin/swap-in the memory and request a DMA address * for it. */ enum dma_mapping_type { GENWQE_MAPPING_RAW = 0, /* contignous memory buffer */ GENWQE_MAPPING_SGL_TEMP, /* sglist dynamically used */ GENWQE_MAPPING_SGL_PINNED, /* sglist used with pinning */ }; /** * struct dma_mapping - Information about memory mappings done by the driver */ struct dma_mapping { enum dma_mapping_type type; void *u_vaddr; /* user-space vaddr/non-aligned */ void *k_vaddr; /* kernel-space vaddr/non-aligned */ dma_addr_t dma_addr; /* physical DMA address */ struct page **page_list; /* list of pages used by user buff */ dma_addr_t *dma_list; /* list of dma addresses per page */ unsigned int nr_pages; /* number of pages */ unsigned int size; /* size in bytes */ struct list_head card_list; /* list of usr_maps for card */ struct list_head pin_list; /* list of pinned memory for dev */ }; static inline void genwqe_mapping_init(struct dma_mapping *m, enum dma_mapping_type type) { memset(m, 0, sizeof(*m)); m->type = type; } /** * struct ddcb_queue - DDCB queue data * @ddcb_max: Number of DDCBs on the queue * @ddcb_next: Next free DDCB * @ddcb_act: Next DDCB supposed to finish * @ddcb_seq: Sequence number of last DDCB * @ddcbs_in_flight: Currently enqueued DDCBs * @ddcbs_completed: Number of already completed DDCBs * @busy: Number of -EBUSY returns * @ddcb_daddr: DMA address of first DDCB in the queue * @ddcb_vaddr: Kernel virtual address of first DDCB in the queue * @ddcb_req: Associated requests (one per DDCB) * @ddcb_waitqs: Associated wait queues (one per DDCB) * @ddcb_lock: Lock to protect queuing operations * @ddcb_waitq: Wait on next DDCB finishing */ struct ddcb_queue { int ddcb_max; /* amount of DDCBs */ int ddcb_next; /* next available DDCB num */ int ddcb_act; /* DDCB to be processed */ u16 ddcb_seq; /* slc seq num */ unsigned int ddcbs_in_flight; /* number of ddcbs in processing */ unsigned int ddcbs_completed; unsigned int ddcbs_max_in_flight; unsigned int busy; /* how many times -EBUSY? */ dma_addr_t ddcb_daddr; /* DMA address */ struct ddcb *ddcb_vaddr; /* kernel virtual addr for DDCBs */ struct ddcb_requ **ddcb_req; /* ddcb processing parameter */ wait_queue_head_t *ddcb_waitqs; /* waitqueue per ddcb */ spinlock_t ddcb_lock; /* exclusive access to queue */ wait_queue_head_t ddcb_waitq; /* wait for ddcb processing */ /* registers or the respective queue to be used */ u32 IO_QUEUE_CONFIG; u32 IO_QUEUE_STATUS; u32 IO_QUEUE_SEGMENT; u32 IO_QUEUE_INITSQN; u32 IO_QUEUE_WRAP; u32 IO_QUEUE_OFFSET; u32 IO_QUEUE_WTIME; u32 IO_QUEUE_ERRCNTS; u32 IO_QUEUE_LRW; }; /* * GFIR, SLU_UNITCFG, APP_UNITCFG * 8 Units with FIR/FEC + 64 * 2ndary FIRS/FEC. */ #define GENWQE_FFDC_REGS (3 + (8 * (2 + 2 * 64))) struct genwqe_ffdc { unsigned int entries; struct genwqe_reg *regs; }; /** * struct genwqe_dev - GenWQE device information * @card_state: Card operation state, see above * @ffdc: First Failure Data Capture buffers for each unit * @card_thread: Working thread to operate the DDCB queue * @card_waitq: Wait queue used in card_thread * @queue: DDCB queue * @health_thread: Card monitoring thread (only for PFs) * @health_waitq: Wait queue used in health_thread * @pci_dev: Associated PCI device (function) * @mmio: Base address of 64-bit register space * @mmio_len: Length of register area * @file_lock: Lock to protect access to file_list * @file_list: List of all processes with open GenWQE file descriptors * * This struct contains all information needed to communicate with a * GenWQE card. It is initialized when a GenWQE device is found and * destroyed when it goes away. It holds data to maintain the queue as * well as data needed to feed the user interfaces. */ struct genwqe_dev { enum genwqe_card_state card_state; spinlock_t print_lock; int card_idx; /* card index 0..CARD_NO_MAX-1 */ u64 flags; /* general flags */ /* FFDC data gathering */ struct genwqe_ffdc ffdc[GENWQE_DBG_UNITS]; /* DDCB workqueue */ struct task_struct *card_thread; wait_queue_head_t queue_waitq; struct ddcb_queue queue; /* genwqe DDCB queue */ unsigned int irqs_processed; /* Card health checking thread */ struct task_struct *health_thread; wait_queue_head_t health_waitq; /* char device */ dev_t devnum_genwqe; /* major/minor num card */ struct class *class_genwqe; /* reference to class object */ struct device *dev; /* for device creation */ struct cdev cdev_genwqe; /* char device for card */ struct dentry *debugfs_root; /* debugfs card root directory */ struct dentry *debugfs_genwqe; /* debugfs driver root directory */ /* pci resources */ struct pci_dev *pci_dev; /* PCI device */ void __iomem *mmio; /* BAR-0 MMIO start */ unsigned long mmio_len; u16 num_vfs; u32 vf_jobtimeout_msec[GENWQE_MAX_VFS]; int is_privileged; /* access to all regs possible */ /* config regs which we need often */ u64 slu_unitcfg; u64 app_unitcfg; u64 softreset; u64 err_inject; u64 last_gfir; char app_name[5]; spinlock_t file_lock; /* lock for open files */ struct list_head file_list; /* list of open files */ /* debugfs parameters */ int ddcb_software_timeout; /* wait until DDCB times out */ int skip_recovery; /* circumvention if recovery fails */ int kill_timeout; /* wait after sending SIGKILL */ }; /** * enum genwqe_requ_state - State of a DDCB execution request */ enum genwqe_requ_state { GENWQE_REQU_NEW = 0, GENWQE_REQU_ENQUEUED = 1, GENWQE_REQU_TAPPED = 2, GENWQE_REQU_FINISHED = 3, GENWQE_REQU_STATE_MAX, }; /** * struct ddcb_requ - Kernel internal representation of the DDCB request * @cmd: User space representation of the DDCB execution request */ struct ddcb_requ { /* kernel specific content */ enum genwqe_requ_state req_state; /* request status */ int num; /* ddcb_no for this request */ struct ddcb_queue *queue; /* associated queue */ struct dma_mapping dma_mappings[DDCB_FIXUPS]; struct sg_entry *sgl[DDCB_FIXUPS]; dma_addr_t sgl_dma_addr[DDCB_FIXUPS]; size_t sgl_size[DDCB_FIXUPS]; /* kernel/user shared content */ struct genwqe_ddcb_cmd cmd; /* ddcb_no for this request */ struct genwqe_debug_data debug_data; }; /** * struct genwqe_file - Information for open GenWQE devices */ struct genwqe_file { struct genwqe_dev *cd; struct genwqe_driver *client; struct file *filp; struct fasync_struct *async_queue; struct task_struct *owner; struct list_head list; /* entry in list of open files */ spinlock_t map_lock; /* lock for dma_mappings */ struct list_head map_list; /* list of dma_mappings */ spinlock_t pin_lock; /* lock for pinned memory */ struct list_head pin_list; /* list of pinned memory */ }; int genwqe_setup_service_layer(struct genwqe_dev *cd); /* for PF only */ int genwqe_finish_queue(struct genwqe_dev *cd); int genwqe_release_service_layer(struct genwqe_dev *cd); /** * genwqe_get_slu_id() - Read Service Layer Unit Id * Return: 0x00: Development code * 0x01: SLC1 (old) * 0x02: SLC2 (sept2012) * 0x03: SLC2 (feb2013, generic driver) */ static inline int genwqe_get_slu_id(struct genwqe_dev *cd) { return (int)((cd->slu_unitcfg >> 32) & 0xff); } int genwqe_ddcbs_in_flight(struct genwqe_dev *cd); u8 genwqe_card_type(struct genwqe_dev *cd); int genwqe_card_reset(struct genwqe_dev *cd); int genwqe_set_interrupt_capability(struct genwqe_dev *cd, int count); void genwqe_reset_interrupt_capability(struct genwqe_dev *cd); int genwqe_device_create(struct genwqe_dev *cd); int genwqe_device_remove(struct genwqe_dev *cd); /* debugfs */ int genwqe_init_debugfs(struct genwqe_dev *cd); void genqwe_exit_debugfs(struct genwqe_dev *cd); int genwqe_read_softreset(struct genwqe_dev *cd); /* Hardware Circumventions */ int genwqe_recovery_on_fatal_gfir_required(struct genwqe_dev *cd); int genwqe_flash_readback_fails(struct genwqe_dev *cd); /** * genwqe_write_vreg() - Write register in VF window * @cd: genwqe device * @reg: register address * @val: value to write * @func: 0: PF, 1: VF0, ..., 15: VF14 */ int genwqe_write_vreg(struct genwqe_dev *cd, u32 reg, u64 val, int func); /** * genwqe_read_vreg() - Read register in VF window * @cd: genwqe device * @reg: register address * @func: 0: PF, 1: VF0, ..., 15: VF14 * * Return: content of the register */ u64 genwqe_read_vreg(struct genwqe_dev *cd, u32 reg, int func); /* FFDC Buffer Management */ int genwqe_ffdc_buff_size(struct genwqe_dev *cd, int unit_id); int genwqe_ffdc_buff_read(struct genwqe_dev *cd, int unit_id, struct genwqe_reg *regs, unsigned int max_regs); int genwqe_read_ffdc_regs(struct genwqe_dev *cd, struct genwqe_reg *regs, unsigned int max_regs, int all); int genwqe_ffdc_dump_dma(struct genwqe_dev *cd, struct genwqe_reg *regs, unsigned int max_regs); int genwqe_init_debug_data(struct genwqe_dev *cd, struct genwqe_debug_data *d); void genwqe_init_crc32(void); int genwqe_read_app_id(struct genwqe_dev *cd, char *app_name, int len); /* Memory allocation/deallocation; dma address handling */ int genwqe_user_vmap(struct genwqe_dev *cd, struct dma_mapping *m, void *uaddr, unsigned long size, struct ddcb_requ *req); int genwqe_user_vunmap(struct genwqe_dev *cd, struct dma_mapping *m, struct ddcb_requ *req); struct sg_entry *genwqe_alloc_sgl(struct genwqe_dev *cd, int num_pages, dma_addr_t *dma_addr, size_t *sgl_size); void genwqe_free_sgl(struct genwqe_dev *cd, struct sg_entry *sg_list, dma_addr_t dma_addr, size_t size); int genwqe_setup_sgl(struct genwqe_dev *cd, unsigned long offs, unsigned long size, struct sg_entry *sgl, /* genwqe sgl */ dma_addr_t dma_addr, size_t sgl_size, dma_addr_t *dma_list, int page_offs, int num_pages); int genwqe_check_sgl(struct genwqe_dev *cd, struct sg_entry *sg_list, int size); static inline bool dma_mapping_used(struct dma_mapping *m) { if (!m) return 0; return m->size != 0; } /** * __genwqe_execute_ddcb() - Execute DDCB request with addr translation * * This function will do the address translation changes to the DDCBs * according to the definitions required by the ATS field. It looks up * the memory allocation buffer or does vmap/vunmap for the respective * user-space buffers, inclusive page pinning and scatter gather list * buildup and teardown. */ int __genwqe_execute_ddcb(struct genwqe_dev *cd, struct genwqe_ddcb_cmd *cmd); /** * __genwqe_execute_raw_ddcb() - Execute DDCB request without addr translation * * This version will not do address translation or any modifcation of * the DDCB data. It is used e.g. for the MoveFlash DDCB which is * entirely prepared by the driver itself. That means the appropriate * DMA addresses are already in the DDCB and do not need any * modification. */ int __genwqe_execute_raw_ddcb(struct genwqe_dev *cd, struct genwqe_ddcb_cmd *cmd); int __genwqe_enqueue_ddcb(struct genwqe_dev *cd, struct ddcb_requ *req); int __genwqe_wait_ddcb(struct genwqe_dev *cd, struct ddcb_requ *req); int __genwqe_purge_ddcb(struct genwqe_dev *cd, struct ddcb_requ *req); /* register access */ int __genwqe_writeq(struct genwqe_dev *cd, u64 byte_offs, u64 val); u64 __genwqe_readq(struct genwqe_dev *cd, u64 byte_offs); int __genwqe_writel(struct genwqe_dev *cd, u64 byte_offs, u32 val); u32 __genwqe_readl(struct genwqe_dev *cd, u64 byte_offs); void *__genwqe_alloc_consistent(struct genwqe_dev *cd, size_t size, dma_addr_t *dma_handle); void __genwqe_free_consistent(struct genwqe_dev *cd, size_t size, void *vaddr, dma_addr_t dma_handle); /* Base clock frequency in MHz */ int genwqe_base_clock_frequency(struct genwqe_dev *cd); /* Before FFDC is captured the traps should be stopped. */ void genwqe_stop_traps(struct genwqe_dev *cd); void genwqe_start_traps(struct genwqe_dev *cd); /* Hardware circumvention */ bool genwqe_need_err_masking(struct genwqe_dev *cd); /** * genwqe_is_privileged() - Determine operation mode for PCI function * * On Intel with SRIOV support we see: * PF: is_physfn = 1 is_virtfn = 0 * VF: is_physfn = 0 is_virtfn = 1 * * On Systems with no SRIOV support _and_ virtualized systems we get: * is_physfn = 0 is_virtfn = 0 * * Other vendors have individual pci device ids to distinguish between * virtual function drivers and physical function drivers. GenWQE * unfortunately has just on pci device id for both, VFs and PF. * * The following code is used to distinguish if the card is running in * privileged mode, either as true PF or in a virtualized system with * full register access e.g. currently on PowerPC. * * if (pci_dev->is_virtfn) * cd->is_privileged = 0; * else * cd->is_privileged = (__genwqe_readq(cd, IO_SLU_BITSTREAM) * != IO_ILLEGAL_VALUE); */ static inline int genwqe_is_privileged(struct genwqe_dev *cd) { return cd->is_privileged; } #endif /* __CARD_BASE_H__ */