diff options
Diffstat (limited to 'contrib/syslinux-4.02/gpxe/src/drivers/infiniband/hermon.h')
-rw-r--r-- | contrib/syslinux-4.02/gpxe/src/drivers/infiniband/hermon.h | 610 |
1 files changed, 610 insertions, 0 deletions
diff --git a/contrib/syslinux-4.02/gpxe/src/drivers/infiniband/hermon.h b/contrib/syslinux-4.02/gpxe/src/drivers/infiniband/hermon.h new file mode 100644 index 0000000..c53f3da --- /dev/null +++ b/contrib/syslinux-4.02/gpxe/src/drivers/infiniband/hermon.h @@ -0,0 +1,610 @@ +#ifndef _HERMON_H +#define _HERMON_H + +/** @file + * + * Mellanox Hermon Infiniband HCA driver + * + */ + +FILE_LICENCE ( GPL2_OR_LATER ); + +#include <stdint.h> +#include <gpxe/uaccess.h> +#include <gpxe/ib_packet.h> +#include "mlx_bitops.h" +#include "MT25408_PRM.h" + +/* + * Hardware constants + * + */ + +/* Ports in existence */ +#define HERMON_MAX_PORTS 2 +#define HERMON_PORT_BASE 1 + +/* PCI BARs */ +#define HERMON_PCI_CONFIG_BAR PCI_BASE_ADDRESS_0 +#define HERMON_PCI_CONFIG_BAR_SIZE 0x100000 +#define HERMON_PCI_UAR_BAR PCI_BASE_ADDRESS_2 + +/* Device reset */ +#define HERMON_RESET_OFFSET 0x0f0010 +#define HERMON_RESET_MAGIC 0x01000000UL +#define HERMON_RESET_WAIT_TIME_MS 1000 + +/* Work queue entry and completion queue entry opcodes */ +#define HERMON_OPCODE_NOP 0x00 +#define HERMON_OPCODE_SEND 0x0a +#define HERMON_OPCODE_RECV_ERROR 0xfe +#define HERMON_OPCODE_SEND_ERROR 0xff + +/* HCA command register opcodes */ +#define HERMON_HCR_QUERY_DEV_CAP 0x0003 +#define HERMON_HCR_QUERY_FW 0x0004 +#define HERMON_HCR_INIT_HCA 0x0007 +#define HERMON_HCR_CLOSE_HCA 0x0008 +#define HERMON_HCR_INIT_PORT 0x0009 +#define HERMON_HCR_CLOSE_PORT 0x000a +#define HERMON_HCR_SW2HW_MPT 0x000d +#define HERMON_HCR_WRITE_MTT 0x0011 +#define HERMON_HCR_MAP_EQ 0x0012 +#define HERMON_HCR_SW2HW_EQ 0x0013 +#define HERMON_HCR_HW2SW_EQ 0x0014 +#define HERMON_HCR_QUERY_EQ 0x0015 +#define HERMON_HCR_SW2HW_CQ 0x0016 +#define HERMON_HCR_HW2SW_CQ 0x0017 +#define HERMON_HCR_RST2INIT_QP 0x0019 +#define HERMON_HCR_INIT2RTR_QP 0x001a +#define HERMON_HCR_RTR2RTS_QP 0x001b +#define HERMON_HCR_RTS2RTS_QP 0x001c +#define HERMON_HCR_2RST_QP 0x0021 +#define HERMON_HCR_QUERY_QP 0x0022 +#define HERMON_HCR_CONF_SPECIAL_QP 0x0023 +#define HERMON_HCR_MAD_IFC 0x0024 +#define HERMON_HCR_READ_MCG 0x0025 +#define HERMON_HCR_WRITE_MCG 0x0026 +#define HERMON_HCR_MGID_HASH 0x0027 +#define HERMON_HCR_SENSE_PORT 0x004d +#define HERMON_HCR_RUN_FW 0x0ff6 +#define HERMON_HCR_DISABLE_LAM 0x0ff7 +#define HERMON_HCR_ENABLE_LAM 0x0ff8 +#define HERMON_HCR_UNMAP_ICM 0x0ff9 +#define HERMON_HCR_MAP_ICM 0x0ffa +#define HERMON_HCR_UNMAP_ICM_AUX 0x0ffb +#define HERMON_HCR_MAP_ICM_AUX 0x0ffc +#define HERMON_HCR_SET_ICM_SIZE 0x0ffd +#define HERMON_HCR_UNMAP_FA 0x0ffe +#define HERMON_HCR_MAP_FA 0x0fff + +/* Service types */ +#define HERMON_ST_RC 0x00 +#define HERMON_ST_UD 0x03 +#define HERMON_ST_MLX 0x07 + +/* MTUs */ +#define HERMON_MTU_2048 0x04 + +#define HERMON_INVALID_LKEY 0x00000100UL + +#define HERMON_PAGE_SIZE 4096 + +#define HERMON_DB_POST_SND_OFFSET 0x14 +#define HERMON_DB_EQ_OFFSET(_eqn) \ + ( 0x800 + HERMON_PAGE_SIZE * ( (_eqn) / 4 ) + 0x08 * ( (_eqn) % 4 ) ) + +#define HERMON_QP_OPT_PARAM_PM_STATE 0x00000400UL +#define HERMON_QP_OPT_PARAM_QKEY 0x00000020UL +#define HERMON_QP_OPT_PARAM_ALT_PATH 0x00000001UL + +#define HERMON_MAP_EQ ( 0UL << 31 ) +#define HERMON_UNMAP_EQ ( 1UL << 31 ) + +#define HERMON_EV_PORT_STATE_CHANGE 0x09 + +#define HERMON_SCHED_QP0 0x3f +#define HERMON_SCHED_DEFAULT 0x83 + +#define HERMON_PM_STATE_ARMED 0x00 +#define HERMON_PM_STATE_REARM 0x01 +#define HERMON_PM_STATE_MIGRATED 0x03 + +#define HERMON_RETRY_MAX 0x07 + +/* + * Datatypes that seem to be missing from the autogenerated documentation + * + */ +struct hermonprm_mgm_hash_st { + pseudo_bit_t reserved0[0x00020]; +/* -------------- */ + pseudo_bit_t hash[0x00010]; + pseudo_bit_t reserved1[0x00010]; +} __attribute__ (( packed )); + +struct hermonprm_mcg_entry_st { + struct hermonprm_mcg_hdr_st hdr; + struct hermonprm_mcg_qp_dw_st qp[8]; +} __attribute__ (( packed )); + +struct hermonprm_cq_db_record_st { + pseudo_bit_t update_ci[0x00018]; + pseudo_bit_t reserved0[0x00008]; +/* -------------- */ + pseudo_bit_t arm_ci[0x00018]; + pseudo_bit_t cmd[0x00003]; + pseudo_bit_t reserved1[0x00001]; + pseudo_bit_t cmd_sn[0x00002]; + pseudo_bit_t reserved2[0x00002]; +} __attribute__ (( packed )); + +struct hermonprm_send_db_register_st { + pseudo_bit_t reserved[0x00008]; + pseudo_bit_t qn[0x00018]; +} __attribute__ (( packed )); + +struct hermonprm_event_db_register_st { + pseudo_bit_t ci[0x00018]; + pseudo_bit_t reserver[0x00007]; + pseudo_bit_t a[0x00001]; +} __attribute__ (( packed )); + +struct hermonprm_scalar_parameter_st { + pseudo_bit_t value_hi[0x00020]; +/* -------------- */ + pseudo_bit_t value[0x00020]; +} __attribute__ (( packed )); + +struct hermonprm_event_mask_st { + pseudo_bit_t reserved0[0x00020]; +/* -------------- */ + pseudo_bit_t completion[0x00001]; + pseudo_bit_t reserved1[0x0008]; + pseudo_bit_t port_state_change[0x00001]; + pseudo_bit_t reserved2[0x00016]; +} __attribute__ (( packed )); + +struct hermonprm_port_state_change_event_st { + pseudo_bit_t reserved[0x00020]; + struct hermonprm_port_state_change_st data; +} __attribute__ (( packed )); + +/** Hermon sense port */ +struct hermonprm_sense_port_st { + pseudo_bit_t port_type[0x00020]; +/* -------------- */ + pseudo_bit_t reserved[0x00020]; +}; +#define HERMON_PORT_TYPE_IB 1 + +/* + * Wrapper structures for hardware datatypes + * + */ + +struct MLX_DECLARE_STRUCT ( hermonprm_completion_queue_context ); +struct MLX_DECLARE_STRUCT ( hermonprm_completion_queue_entry ); +struct MLX_DECLARE_STRUCT ( hermonprm_completion_with_error ); +struct MLX_DECLARE_STRUCT ( hermonprm_cq_db_record ); +struct MLX_DECLARE_STRUCT ( hermonprm_eqc ); +struct MLX_DECLARE_STRUCT ( hermonprm_event_db_register ); +struct MLX_DECLARE_STRUCT ( hermonprm_event_mask ); +struct MLX_DECLARE_STRUCT ( hermonprm_event_queue_entry ); +struct MLX_DECLARE_STRUCT ( hermonprm_hca_command_register ); +struct MLX_DECLARE_STRUCT ( hermonprm_init_hca ); +struct MLX_DECLARE_STRUCT ( hermonprm_init_port ); +struct MLX_DECLARE_STRUCT ( hermonprm_mad_ifc ); +struct MLX_DECLARE_STRUCT ( hermonprm_mcg_entry ); +struct MLX_DECLARE_STRUCT ( hermonprm_mgm_hash ); +struct MLX_DECLARE_STRUCT ( hermonprm_mpt ); +struct MLX_DECLARE_STRUCT ( hermonprm_mtt ); +struct MLX_DECLARE_STRUCT ( hermonprm_port_state_change_event ); +struct MLX_DECLARE_STRUCT ( hermonprm_qp_db_record ); +struct MLX_DECLARE_STRUCT ( hermonprm_qp_ee_state_transitions ); +struct MLX_DECLARE_STRUCT ( hermonprm_query_dev_cap ); +struct MLX_DECLARE_STRUCT ( hermonprm_query_fw ); +struct MLX_DECLARE_STRUCT ( hermonprm_queue_pair_ee_context_entry ); +struct MLX_DECLARE_STRUCT ( hermonprm_scalar_parameter ); +struct MLX_DECLARE_STRUCT ( hermonprm_sense_port ); +struct MLX_DECLARE_STRUCT ( hermonprm_send_db_register ); +struct MLX_DECLARE_STRUCT ( hermonprm_ud_address_vector ); +struct MLX_DECLARE_STRUCT ( hermonprm_virtual_physical_mapping ); +struct MLX_DECLARE_STRUCT ( hermonprm_wqe_segment_ctrl_mlx ); +struct MLX_DECLARE_STRUCT ( hermonprm_wqe_segment_ctrl_send ); +struct MLX_DECLARE_STRUCT ( hermonprm_wqe_segment_data_ptr ); +struct MLX_DECLARE_STRUCT ( hermonprm_wqe_segment_ud ); + +/* + * Composite hardware datatypes + * + */ + +struct hermonprm_write_mtt { + struct hermonprm_scalar_parameter mtt_base_addr; + struct hermonprm_scalar_parameter reserved; + struct hermonprm_mtt mtt; +} __attribute__ (( packed )); + +#define HERMON_MAX_GATHER 2 + +struct hermonprm_ud_send_wqe { + struct hermonprm_wqe_segment_ctrl_send ctrl; + struct hermonprm_wqe_segment_ud ud; + struct hermonprm_wqe_segment_data_ptr data[HERMON_MAX_GATHER]; +} __attribute__ (( packed )); + +struct hermonprm_mlx_send_wqe { + struct hermonprm_wqe_segment_ctrl_mlx ctrl; + struct hermonprm_wqe_segment_data_ptr data[HERMON_MAX_GATHER]; + uint8_t headers[IB_MAX_HEADER_SIZE]; +} __attribute__ (( packed )); + +struct hermonprm_rc_send_wqe { + struct hermonprm_wqe_segment_ctrl_send ctrl; + struct hermonprm_wqe_segment_data_ptr data[HERMON_MAX_GATHER]; +} __attribute__ (( packed )); + +#define HERMON_MAX_SCATTER 1 + +struct hermonprm_recv_wqe { + struct hermonprm_wqe_segment_data_ptr data[HERMON_MAX_SCATTER]; +} __attribute__ (( packed )); + +union hermonprm_completion_entry { + struct hermonprm_completion_queue_entry normal; + struct hermonprm_completion_with_error error; +} __attribute__ (( packed )); + +union hermonprm_event_entry { + struct hermonprm_event_queue_entry generic; + struct hermonprm_port_state_change_event port_state_change; +} __attribute__ (( packed )); + +union hermonprm_doorbell_register { + struct hermonprm_send_db_register send; + struct hermonprm_event_db_register event; + uint32_t dword[1]; +} __attribute__ (( packed )); + +union hermonprm_mad { + struct hermonprm_mad_ifc ifc; + union ib_mad mad; +} __attribute__ (( packed )); + +/* + * gPXE-specific definitions + * + */ + +/** Hermon device capabilitiess */ +struct hermon_dev_cap { + /** CMPT entry size */ + size_t cmpt_entry_size; + /** Number of reserved QPs */ + unsigned int reserved_qps; + /** QP context entry size */ + size_t qpc_entry_size; + /** Alternate path context entry size */ + size_t altc_entry_size; + /** Auxiliary context entry size */ + size_t auxc_entry_size; + /** Number of reserved SRQs */ + unsigned int reserved_srqs; + /** SRQ context entry size */ + size_t srqc_entry_size; + /** Number of reserved CQs */ + unsigned int reserved_cqs; + /** CQ context entry size */ + size_t cqc_entry_size; + /** Number of reserved EQs */ + unsigned int reserved_eqs; + /** EQ context entry size */ + size_t eqc_entry_size; + /** Number of reserved MTTs */ + unsigned int reserved_mtts; + /** MTT entry size */ + size_t mtt_entry_size; + /** Number of reserved MRWs */ + unsigned int reserved_mrws; + /** DMPT entry size */ + size_t dmpt_entry_size; + /** Number of reserved UARs */ + unsigned int reserved_uars; + /** Number of ports */ + unsigned int num_ports; + /** Dual-port different protocol */ + int dpdp; +}; + +/** Number of cMPT entries of each type */ +#define HERMON_CMPT_MAX_ENTRIES ( 1 << 24 ) + +/** Hermon ICM memory map entry */ +struct hermon_icm_map { + /** Offset (virtual address within ICM) */ + uint64_t offset; + /** Length */ + size_t len; +}; + +/** Discontiguous regions within Hermon ICM */ +enum hermon_icm_map_regions { + HERMON_ICM_QP_CMPT = 0, + HERMON_ICM_SRQ_CMPT, + HERMON_ICM_CQ_CMPT, + HERMON_ICM_EQ_CMPT, + HERMON_ICM_OTHER, + HERMON_ICM_NUM_REGIONS +}; + +/** UAR page for doorbell accesses + * + * Pages 0-127 are reserved for event queue doorbells only, so we use + * page 128. + */ +#define HERMON_UAR_NON_EQ_PAGE 128 + +/** Maximum number of allocatable MTT entries + * + * This is a policy decision, not a device limit. + */ +#define HERMON_MAX_MTTS 64 + +/** A Hermon MTT descriptor */ +struct hermon_mtt { + /** MTT offset */ + unsigned int mtt_offset; + /** Number of pages */ + unsigned int num_pages; + /** MTT base address */ + unsigned int mtt_base_addr; + /** Offset within page */ + unsigned int page_offset; +}; + +/** Alignment of Hermon send work queue entries */ +#define HERMON_SEND_WQE_ALIGN 128 + +/** A Hermon send work queue entry */ +union hermon_send_wqe { + struct hermonprm_wqe_segment_ctrl_send ctrl; + struct hermonprm_ud_send_wqe ud; + struct hermonprm_mlx_send_wqe mlx; + struct hermonprm_rc_send_wqe rc; + uint8_t force_align[HERMON_SEND_WQE_ALIGN]; +} __attribute__ (( packed )); + +/** A Hermon send work queue */ +struct hermon_send_work_queue { + /** Number of work queue entries, including headroom + * + * Hermon requires us to leave unused space within the send + * WQ, so we create a send WQ with more entries than are + * requested in the create_qp() call. + */ + unsigned int num_wqes; + /** Work queue entries */ + union hermon_send_wqe *wqe; + /** Size of work queue */ + size_t wqe_size; + /** Doorbell register */ + void *doorbell; +}; + +/** Alignment of Hermon receive work queue entries */ +#define HERMON_RECV_WQE_ALIGN 16 + +/** A Hermon receive work queue entry */ +union hermon_recv_wqe { + struct hermonprm_recv_wqe recv; + uint8_t force_align[HERMON_RECV_WQE_ALIGN]; +} __attribute__ (( packed )); + +/** A Hermon receive work queue */ +struct hermon_recv_work_queue { + /** Work queue entries */ + union hermon_recv_wqe *wqe; + /** Size of work queue */ + size_t wqe_size; + /** Doorbell */ + struct hermonprm_qp_db_record doorbell __attribute__ (( aligned (4) )); +}; + +/** Number of special queue pairs */ +#define HERMON_NUM_SPECIAL_QPS 8 + +/** Number of queue pairs reserved for the "special QP" block + * + * The special QPs must be within a contiguous block aligned on its + * own size. + */ +#define HERMON_RSVD_SPECIAL_QPS ( ( HERMON_NUM_SPECIAL_QPS << 1 ) - 1 ) + +/** Maximum number of allocatable queue pairs + * + * This is a policy decision, not a device limit. + */ +#define HERMON_MAX_QPS 8 + +/** Queue pair number randomisation mask */ +#define HERMON_QPN_RANDOM_MASK 0xfff000 + +/** Hermon queue pair state */ +enum hermon_queue_pair_state { + HERMON_QP_ST_RST = 0, + HERMON_QP_ST_INIT, + HERMON_QP_ST_RTR, + HERMON_QP_ST_RTS, +}; + +/** A Hermon queue pair */ +struct hermon_queue_pair { + /** Work queue buffer */ + void *wqe; + /** Size of work queue buffer */ + size_t wqe_size; + /** MTT descriptor */ + struct hermon_mtt mtt; + /** Send work queue */ + struct hermon_send_work_queue send; + /** Receive work queue */ + struct hermon_recv_work_queue recv; + /** Queue state */ + enum hermon_queue_pair_state state; +}; + +/** Maximum number of allocatable completion queues + * + * This is a policy decision, not a device limit. + */ +#define HERMON_MAX_CQS 8 + +/** A Hermon completion queue */ +struct hermon_completion_queue { + /** Completion queue entries */ + union hermonprm_completion_entry *cqe; + /** Size of completion queue */ + size_t cqe_size; + /** MTT descriptor */ + struct hermon_mtt mtt; + /** Doorbell */ + struct hermonprm_cq_db_record doorbell __attribute__ (( aligned (8) )); +}; + +/** Maximum number of allocatable event queues + * + * This is a policy decision, not a device limit. + */ +#define HERMON_MAX_EQS 8 + +/** A Hermon event queue */ +struct hermon_event_queue { + /** Event queue entries */ + union hermonprm_event_entry *eqe; + /** Size of event queue */ + size_t eqe_size; + /** MTT descriptor */ + struct hermon_mtt mtt; + /** Event queue number */ + unsigned long eqn; + /** Next event queue entry index */ + unsigned long next_idx; + /** Doorbell register */ + void *doorbell; +}; + +/** Number of event queue entries + * + * This is a policy decision. + */ +#define HERMON_NUM_EQES 4 + +/** A Hermon resource bitmask */ +typedef uint32_t hermon_bitmask_t; + +/** Size of a hermon resource bitmask */ +#define HERMON_BITMASK_SIZE(max_entries) \ + ( ( (max_entries) + ( 8 * sizeof ( hermon_bitmask_t ) ) - 1 ) / \ + ( 8 * sizeof ( hermon_bitmask_t ) ) ) + +/** A Hermon device */ +struct hermon { + /** PCI configuration registers */ + void *config; + /** PCI user Access Region */ + void *uar; + + /** Command toggle */ + unsigned int toggle; + /** Command input mailbox */ + void *mailbox_in; + /** Command output mailbox */ + void *mailbox_out; + + /** Firmware area in external memory */ + userptr_t firmware_area; + /** ICM map */ + struct hermon_icm_map icm_map[HERMON_ICM_NUM_REGIONS]; + /** ICM area */ + userptr_t icm; + + /** Event queue */ + struct hermon_event_queue eq; + /** Unrestricted LKey + * + * Used to get unrestricted memory access. + */ + unsigned long lkey; + + /** Completion queue in-use bitmask */ + hermon_bitmask_t cq_inuse[ HERMON_BITMASK_SIZE ( HERMON_MAX_CQS ) ]; + /** Queue pair in-use bitmask */ + hermon_bitmask_t qp_inuse[ HERMON_BITMASK_SIZE ( HERMON_MAX_QPS ) ]; + /** MTT entry in-use bitmask */ + hermon_bitmask_t mtt_inuse[ HERMON_BITMASK_SIZE ( HERMON_MAX_MTTS ) ]; + + /** Device capabilities */ + struct hermon_dev_cap cap; + /** Special QPN base */ + unsigned long special_qpn_base; + /** QPN base */ + unsigned long qpn_base; + + /** Infiniband devices */ + struct ib_device *ibdev[HERMON_MAX_PORTS]; +}; + +/** Global protection domain */ +#define HERMON_GLOBAL_PD 0x123456 + +/** Memory key prefix */ +#define HERMON_MKEY_PREFIX 0x77000000UL + +/* + * HCA commands + * + */ + +#define HERMON_HCR_BASE 0x80680 +#define HERMON_HCR_REG(x) ( HERMON_HCR_BASE + 4 * (x) ) +#define HERMON_HCR_MAX_WAIT_MS 2000 +#define HERMON_MBOX_ALIGN 4096 +#define HERMON_MBOX_SIZE 512 + +/* HCA command is split into + * + * bits 11:0 Opcode + * bit 12 Input uses mailbox + * bit 13 Output uses mailbox + * bits 22:14 Input parameter length (in dwords) + * bits 31:23 Output parameter length (in dwords) + * + * Encoding the information in this way allows us to cut out several + * parameters to the hermon_command() call. + */ +#define HERMON_HCR_IN_MBOX 0x00001000UL +#define HERMON_HCR_OUT_MBOX 0x00002000UL +#define HERMON_HCR_OPCODE( _command ) ( (_command) & 0xfff ) +#define HERMON_HCR_IN_LEN( _command ) ( ( (_command) >> 12 ) & 0x7fc ) +#define HERMON_HCR_OUT_LEN( _command ) ( ( (_command) >> 21 ) & 0x7fc ) + +/** Build HCR command from component parts */ +#define HERMON_HCR_INOUT_CMD( _opcode, _in_mbox, _in_len, \ + _out_mbox, _out_len ) \ + ( (_opcode) | \ + ( (_in_mbox) ? HERMON_HCR_IN_MBOX : 0 ) | \ + ( ( (_in_len) / 4 ) << 14 ) | \ + ( (_out_mbox) ? HERMON_HCR_OUT_MBOX : 0 ) | \ + ( ( (_out_len) / 4 ) << 23 ) ) + +#define HERMON_HCR_IN_CMD( _opcode, _in_mbox, _in_len ) \ + HERMON_HCR_INOUT_CMD ( _opcode, _in_mbox, _in_len, 0, 0 ) + +#define HERMON_HCR_OUT_CMD( _opcode, _out_mbox, _out_len ) \ + HERMON_HCR_INOUT_CMD ( _opcode, 0, 0, _out_mbox, _out_len ) + +#define HERMON_HCR_VOID_CMD( _opcode ) \ + HERMON_HCR_INOUT_CMD ( _opcode, 0, 0, 0, 0 ) + +#endif /* _HERMON_H */ |