summaryrefslogtreecommitdiffstats
path: root/src
diff options
context:
space:
mode:
authorMichael Brown2016-03-09 01:27:15 +0100
committerMichael Brown2016-03-09 09:46:24 +0100
commite44f6dcb8994a3c5c29b16aacd97ac095f4588c6 (patch)
tree57b7610a6447d6a28ef5be1f786b48217ef507d4 /src
parent[eoib] Support non-FullMember gateway devices (diff)
downloadipxe-e44f6dcb8994a3c5c29b16aacd97ac095f4588c6.tar.gz
ipxe-e44f6dcb8994a3c5c29b16aacd97ac095f4588c6.tar.xz
ipxe-e44f6dcb8994a3c5c29b16aacd97ac095f4588c6.zip
[xsigo] Add support for Xsigo virtual Ethernet (XVE) EoIB devices
Add support for EoIB devices as implemented by Xsigo. Based on the public (but out-of-tree) Linux kernel drivers at https://oss.oracle.com/git/?p=linux-uek.git;a=log;h=v4.1.12-32.2.1 Signed-off-by: Michael Brown <mcb30@ipxe.org>
Diffstat (limited to 'src')
-rw-r--r--src/config/config_infiniband.c3
-rw-r--r--src/config/general.h1
-rw-r--r--src/include/ipxe/errfile.h1
-rw-r--r--src/include/ipxe/xsigo.h406
-rw-r--r--src/net/infiniband/xsigo.c1858
5 files changed, 2269 insertions, 0 deletions
diff --git a/src/config/config_infiniband.c b/src/config/config_infiniband.c
index 9bac3b7c..4da8fe21 100644
--- a/src/config/config_infiniband.c
+++ b/src/config/config_infiniband.c
@@ -44,6 +44,9 @@ REQUIRE_OBJECT ( ib_srp );
#ifdef VNIC_IPOIB
REQUIRE_OBJECT ( ipoib );
#endif
+#ifdef VNIC_XSIGO
+REQUIRE_OBJECT ( xsigo );
+#endif
/*
* Drag in Infiniband-specific commands
diff --git a/src/config/general.h b/src/config/general.h
index 9c433039..e9b781fb 100644
--- a/src/config/general.h
+++ b/src/config/general.h
@@ -158,6 +158,7 @@ FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL );
*
*/
#define VNIC_IPOIB /* Infiniband IPoIB virtual NICs */
+//#define VNIC_XSIGO /* Infiniband Xsigo virtual NICs */
/*
* Error message tables to include
diff --git a/src/include/ipxe/errfile.h b/src/include/ipxe/errfile.h
index e64ccc39..4129861a 100644
--- a/src/include/ipxe/errfile.h
+++ b/src/include/ipxe/errfile.h
@@ -259,6 +259,7 @@ FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL );
#define ERRFILE_peerdisc ( ERRFILE_NET | 0x00450000 )
#define ERRFILE_peerblk ( ERRFILE_NET | 0x00460000 )
#define ERRFILE_peermux ( ERRFILE_NET | 0x00470000 )
+#define ERRFILE_xsigo ( ERRFILE_NET | 0x00480000 )
#define ERRFILE_image ( ERRFILE_IMAGE | 0x00000000 )
#define ERRFILE_elf ( ERRFILE_IMAGE | 0x00010000 )
diff --git a/src/include/ipxe/xsigo.h b/src/include/ipxe/xsigo.h
new file mode 100644
index 00000000..f4f14c48
--- /dev/null
+++ b/src/include/ipxe/xsigo.h
@@ -0,0 +1,406 @@
+#ifndef _IPXE_XSIGO_H
+#define _IPXE_XSIGO_H
+
+/** @file
+ *
+ * Xsigo virtual Ethernet devices
+ *
+ */
+
+FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL );
+
+#include <stdint.h>
+#include <ipxe/infiniband.h>
+#include <ipxe/eoib.h>
+
+/** Xsigo directory service record name */
+#define XDS_SERVICE_NAME "XSIGOXDS"
+
+/** Xsigo configuration manager service ID */
+#define XCM_SERVICE_ID { 0x00, 0x00, 0x00, 0x00, 0x02, 0x13, 0x97, 0x01 }
+
+/** Xsigo management class */
+#define XSIGO_MGMT_CLASS 0x0b
+
+/** Xsigo management class version */
+#define XSIGO_MGMT_CLASS_VERSION 2
+
+/** Xsigo configuration manager request MAD */
+#define XSIGO_ATTR_XCM_REQUEST 0xb002
+
+/** Generic operating system type */
+#define XSIGO_OS_TYPE_GENERIC 0x40
+
+/** Xsigo virtual Ethernet broadcast GID prefix */
+#define XVE_PREFIX 0xff15101cUL
+
+/** Xsigo resource types */
+enum xsigo_resource_type {
+ /** Virtual Ethernet resource type */
+ XSIGO_RESOURCE_XVE = ( 1 << 6 ),
+ /** Absence-of-high-availability "resource" type */
+ XSIGO_RESOURCE_NO_HA = ( 1 << 4 ),
+};
+
+/** A Xsigo server identifier */
+struct xsigo_server_id {
+ /** Virtual machine ID */
+ uint32_t vm;
+ /** Port GUID */
+ union ib_guid guid;
+} __attribute__ (( packed ));
+
+/** A Xsigo configuration manager identifier */
+struct xsigo_manager_id {
+ /** Port GUID */
+ union ib_guid guid;
+ /** LID */
+ uint16_t lid;
+ /** Reserved */
+ uint8_t reserved[10];
+} __attribute__ (( packed ));
+
+/** A Xsigo configuration manager request MAD */
+struct xsigo_managers_request {
+ /** MAD header */
+ struct ib_mad_hdr mad_hdr;
+ /** Reserved */
+ uint8_t reserved0[32];
+ /** Server ID */
+ struct xsigo_server_id server;
+ /** Hostname */
+ char hostname[ 65 /* Seriously, guys? */ ];
+ /** OS version */
+ char os_version[32];
+ /** CPU architecture */
+ char arch[16];
+ /** OS type */
+ uint8_t os_type;
+ /** Reserved */
+ uint8_t reserved1[3];
+ /** Firmware version */
+ uint64_t firmware_version;
+ /** Hardware version */
+ uint32_t hardware_version;
+ /** Driver version */
+ uint32_t driver_version;
+ /** System ID */
+ union ib_gid system_id;
+ /** Resource types */
+ uint16_t resources;
+ /** Reserved */
+ uint8_t reserved2[2];
+ /** Build version */
+ char build[16];
+ /** Reserved */
+ uint8_t reserved3[19];
+} __attribute__ (( packed ));
+
+/** Resource types are present */
+#define XSIGO_RESOURCES_PRESENT 0x8000
+
+/** A Xsigo configuration manager reply MAD */
+struct xsigo_managers_reply {
+ /** MAD header */
+ struct ib_mad_hdr mad_hdr;
+ /** Reserved */
+ uint8_t reserved0[32];
+ /** Server ID */
+ struct xsigo_server_id server;
+ /** Number of XCM records */
+ uint8_t count;
+ /** Version */
+ uint8_t version;
+ /** Reserved */
+ uint8_t reserved1[2];
+ /** Managers */
+ struct xsigo_manager_id manager[8];
+ /** Reserved */
+ uint8_t reserved2[24];
+} __attribute__ (( packed ));
+
+/** A Xsigo MAD */
+union xsigo_mad {
+ /** Generic MAD */
+ union ib_mad mad;
+ /** Configuration manager request */
+ struct xsigo_managers_request request;
+ /** Configuration manager reply */
+ struct xsigo_managers_reply reply;
+} __attribute__ (( packed ));
+
+/** An XSMP node identifier */
+struct xsmp_node_id {
+ /** Auxiliary ID (never used) */
+ uint32_t aux;
+ /** Port GUID */
+ union ib_guid guid;
+} __attribute__ (( packed ));
+
+/** An XSMP message header */
+struct xsmp_message_header {
+ /** Message type */
+ uint8_t type;
+ /** Reason code */
+ uint8_t code;
+ /** Length */
+ uint16_t len;
+ /** Sequence number */
+ uint32_t seq;
+ /** Source node ID */
+ struct xsmp_node_id src;
+ /** Destination node ID */
+ struct xsmp_node_id dst;
+} __attribute__ (( packed ));
+
+/** XSMP message types */
+enum xsmp_message_type {
+ /** Session message type */
+ XSMP_TYPE_SESSION = 1,
+ /** Virtual Ethernet message type */
+ XSMP_TYPE_XVE = 6,
+};
+
+/** An XSMP session message */
+struct xsmp_session_message {
+ /** Message header */
+ struct xsmp_message_header hdr;
+ /** Message type */
+ uint8_t type;
+ /** Reason code */
+ uint8_t code;
+ /** Length (excluding message header) */
+ uint16_t len;
+ /** Operating system type */
+ uint8_t os_type;
+ /** Reserved */
+ uint8_t reserved0;
+ /** Resource types */
+ uint16_t resources;
+ /** Driver version */
+ uint32_t driver_version;
+ /** Required chassis version */
+ uint32_t chassis_version;
+ /** Boot flags */
+ uint32_t boot;
+ /** Firmware version */
+ uint64_t firmware_version;
+ /** Hardware version */
+ uint32_t hardware_version;
+ /** Vendor part ID */
+ uint32_t vendor;
+ /** Protocol version */
+ uint32_t xsmp_version;
+ /** Chassis name */
+ char chassis[32];
+ /** Session name */
+ char session[32];
+ /** Reserved */
+ uint8_t reserved1[120];
+} __attribute__ (( packed ));
+
+/** XSMP session message types */
+enum xsmp_session_type {
+ /** Keepalive message */
+ XSMP_SESSION_TYPE_HELLO = 1,
+ /** Initial registration message */
+ XSMP_SESSION_TYPE_REGISTER = 2,
+ /** Registration confirmation message */
+ XSMP_SESSION_TYPE_CONFIRM = 3,
+ /** Registration rejection message */
+ XSMP_SESSION_TYPE_REJECT = 4,
+ /** Shutdown message */
+ XSMP_SESSION_TYPE_SHUTDOWN = 5,
+};
+
+/** XSMP boot flags */
+enum xsmp_session_boot {
+ /** PXE boot */
+ XSMP_BOOT_PXE = ( 1 << 0 ),
+};
+
+/** XSMP virtual Ethernet channel adapter parameters */
+struct xsmp_xve_ca {
+ /** Subnet prefix (little-endian) */
+ union ib_guid prefix_le;
+ /** Control queue pair number */
+ uint32_t ctrl;
+ /** Data queue pair number */
+ uint32_t data;
+ /** Partition key */
+ uint16_t pkey;
+ /** Queue key */
+ uint16_t qkey;
+} __attribute__ (( packed ));
+
+/** XSMP virtual Ethernet MAC address */
+struct xsmp_xve_mac {
+ /** High 16 bits */
+ uint16_t high;
+ /** Low 32 bits */
+ uint32_t low;
+} __attribute__ (( packed ));
+
+/** An XSMP virtual Ethernet message */
+struct xsmp_xve_message {
+ /** Message header */
+ struct xsmp_message_header hdr;
+ /** Message type */
+ uint8_t type;
+ /** Reason code */
+ uint8_t code;
+ /** Length (excluding message header) */
+ uint16_t len;
+ /** Update bitmask */
+ uint32_t update;
+ /** Resource identifier */
+ union ib_guid resource;
+ /** TCA GUID (little-endian) */
+ union ib_guid guid_le;
+ /** TCA LID */
+ uint16_t lid;
+ /** MAC address (little-endian) */
+ struct xsmp_xve_mac mac_le;
+ /** Rate */
+ uint16_t rate;
+ /** Administrative state (non-zero = "up") */
+ uint16_t state;
+ /** Encapsulation (apparently obsolete and unused) */
+ uint16_t encap;
+ /** MTU */
+ uint16_t mtu;
+ /** Installation flags (apparently obsolete and unused) */
+ uint32_t install;
+ /** Interface name */
+ char name[16];
+ /** Service level */
+ uint16_t sl;
+ /** Flow control enabled (apparently obsolete and unused) */
+ uint16_t flow;
+ /** Committed rate (in Mbps) */
+ uint16_t committed_mbps;
+ /** Peak rate (in Mbps) */
+ uint16_t peak_mbps;
+ /** Committed burst size (in bytes) */
+ uint32_t committed_burst;
+ /** Peak burst size (in bytes) */
+ uint32_t peak_burst;
+ /** VMware index */
+ uint8_t vmware;
+ /** Reserved */
+ uint8_t reserved0;
+ /** Multipath flags */
+ uint16_t multipath;
+ /** Multipath group name */
+ char group[48];
+ /** Link aggregation flag */
+ uint8_t agg;
+ /** Link aggregation policy */
+ uint8_t policy;
+ /** Network ID */
+ uint32_t network;
+ /** Mode */
+ uint8_t mode;
+ /** Uplink type */
+ uint8_t uplink;
+ /** Target channel adapter parameters */
+ struct xsmp_xve_ca tca;
+ /** Host channel adapter parameters */
+ struct xsmp_xve_ca hca;
+ /** Reserved */
+ uint8_t reserved1[336];
+} __attribute__ (( packed ));
+
+/** XSMP virtual Ethernet message types */
+enum xsmp_xve_type {
+ /** Install virtual NIC */
+ XSMP_XVE_TYPE_INSTALL = 1,
+ /** Delete virtual NIC */
+ XSMP_XVE_TYPE_DELETE = 2,
+ /** Update virtual NIC */
+ XSMP_XVE_TYPE_UPDATE = 3,
+ /** Set operational state up */
+ XSMP_XVE_TYPE_OPER_UP = 6,
+ /** Set operational state down */
+ XSMP_XVE_TYPE_OPER_DOWN = 7,
+ /** Get operational state */
+ XSMP_XVE_TYPE_OPER_REQ = 15,
+ /** Virtual NIC is ready */
+ XSMP_XVE_TYPE_READY = 20,
+};
+
+/** XSMP virtual Ethernet message codes */
+enum xsmp_xve_code {
+ /* Something went wrong */
+ XSMP_XVE_CODE_ERROR = 0x84,
+};
+
+/** XSMP virtual Ethernet update bitmask */
+enum xsmp_xve_update {
+ /** Update MTU */
+ XSMP_XVE_UPDATE_MTU = ( 1 << 2 ),
+ /** Update administrative state */
+ XSMP_XVE_UPDATE_STATE = ( 1 << 6 ),
+ /** Update gateway to mark as down */
+ XSMP_XVE_UPDATE_GW_DOWN = ( 1 << 30 ),
+ /** Update gateway information */
+ XSMP_XVE_UPDATE_GW_CHANGE = ( 1 << 31 ),
+};
+
+/** XSMP virtual Ethernet modes */
+enum xsmp_xve_mode {
+ /** Reliable Connected */
+ XSMP_XVE_MODE_RC = 1,
+ /** Unreliable Datagram */
+ XSMP_XVE_MODE_UD = 2,
+};
+
+/** XSMP virtual Ethernet uplink types */
+enum xsmp_xve_uplink {
+ /** No uplink */
+ XSMP_XVE_NO_UPLINK = 1,
+ /** Has uplink */
+ XSMP_XVE_UPLINK = 2,
+};
+
+/** An XSMP message */
+union xsmp_message {
+ /** Message header */
+ struct xsmp_message_header hdr;
+ /** Session message */
+ struct xsmp_session_message sess;
+ /** Virtual Ethernet message */
+ struct xsmp_xve_message xve;
+};
+
+/** Delay between attempts to open the Infiniband device
+ *
+ * This is a policy decision.
+ */
+#define XSIGO_OPEN_RETRY_DELAY ( 2 * TICKS_PER_SEC )
+
+/** Delay between unsuccessful discovery attempts
+ *
+ * This is a policy decision.
+ */
+#define XSIGO_DISCOVERY_FAILURE_DELAY ( 10 * TICKS_PER_SEC )
+
+/** Delay between successful discovery attempts
+ *
+ * This is a policy decision.
+ */
+#define XSIGO_DISCOVERY_SUCCESS_DELAY ( 20 * TICKS_PER_SEC )
+
+/** Delay between keepalive requests
+ *
+ * This is a policy decision.
+ */
+#define XSIGO_KEEPALIVE_INTERVAL ( 10 * TICKS_PER_SEC )
+
+/** Maximum time to wait for a keepalive response
+ *
+ * This is a policy decision.
+ */
+#define XSIGO_KEEPALIVE_MAX_WAIT ( 2 * TICKS_PER_SEC )
+
+#endif /* _IPXE_XSIGO_H */
diff --git a/src/net/infiniband/xsigo.c b/src/net/infiniband/xsigo.c
new file mode 100644
index 00000000..91b7b71f
--- /dev/null
+++ b/src/net/infiniband/xsigo.c
@@ -0,0 +1,1858 @@
+/*
+ * Copyright (C) 2016 Michael Brown <mbrown@fensystems.co.uk>.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License as
+ * published by the Free Software Foundation; either version 2 of the
+ * License, or any later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
+ * 02110-1301, USA.
+ *
+ * You can also choose to distribute this program under the terms of
+ * the Unmodified Binary Distribution Licence (as given in the file
+ * COPYING.UBDL), provided that you have satisfied its requirements.
+ */
+
+FILE_LICENCE ( GPL2_OR_LATER_OR_UBDL );
+
+#include <string.h>
+#include <stdio.h>
+#include <errno.h>
+#include <byteswap.h>
+#include <ipxe/version.h>
+#include <ipxe/timer.h>
+#include <ipxe/malloc.h>
+#include <ipxe/iobuf.h>
+#include <ipxe/retry.h>
+#include <ipxe/process.h>
+#include <ipxe/settings.h>
+#include <ipxe/infiniband.h>
+#include <ipxe/ib_service.h>
+#include <ipxe/ib_cmrc.h>
+#include <ipxe/if_ether.h>
+#include <ipxe/ethernet.h>
+#include <ipxe/eoib.h>
+#include <ipxe/xsigo.h>
+
+/** @file
+ *
+ * Xsigo virtual Ethernet devices
+ *
+ */
+
+/** A Xsigo device */
+struct xsigo_device {
+ /** Reference count */
+ struct refcnt refcnt;
+ /** Underlying Infiniband device */
+ struct ib_device *ibdev;
+ /** List of Xsigo devices */
+ struct list_head list;
+ /** Device name */
+ const char *name;
+
+ /** Link opener timer */
+ struct retry_timer opener;
+
+ /** Discovery timer */
+ struct retry_timer discovery;
+ /** Discovery management transaction (if any) */
+ struct ib_mad_transaction *madx;
+
+ /** List of configuration managers */
+ struct list_head managers;
+};
+
+/** A Xsigo configuration manager */
+struct xsigo_manager {
+ /** Reference count */
+ struct refcnt refcnt;
+ /** Xsigo device */
+ struct xsigo_device *xdev;
+ /** List of managers */
+ struct list_head list;
+ /** Device name */
+ char name[16];
+ /** Manager ID */
+ struct xsigo_manager_id id;
+
+ /** Data transfer interface */
+ struct interface xfer;
+ /** Connection timer */
+ struct retry_timer reopen;
+ /** Keepalive timer */
+ struct retry_timer keepalive;
+ /** Transmission process */
+ struct process process;
+ /** Pending transmissions */
+ unsigned int pending;
+ /** Transmit sequence number */
+ uint32_t seq;
+
+ /** List of virtual Ethernet devices */
+ struct list_head nics;
+};
+
+/** Configuration manager pending transmissions */
+enum xsigo_manager_pending {
+ /** Send connection request */
+ XCM_TX_CONNECT = 0x0001,
+ /** Send registration message */
+ XCM_TX_REGISTER = 0x0002,
+};
+
+/** A Xsigo virtual Ethernet device */
+struct xsigo_nic {
+ /** Configuration manager */
+ struct xsigo_manager *xcm;
+ /** List of virtual Ethernet devices */
+ struct list_head list;
+ /** Device name */
+ char name[16];
+
+ /** Resource identifier */
+ union ib_guid resource;
+ /** MAC address */
+ uint8_t mac[ETH_ALEN];
+ /** Network ID */
+ unsigned long network;
+};
+
+/** Configuration manager service ID */
+static union ib_guid xcm_service_id = {
+ .bytes = XCM_SERVICE_ID,
+};
+
+/** List of all Xsigo devices */
+static LIST_HEAD ( xsigo_devices );
+
+/**
+ * Free Xsigo device
+ *
+ * @v refcnt Reference count
+ */
+static void xsigo_free ( struct refcnt *refcnt ) {
+ struct xsigo_device *xdev =
+ container_of ( refcnt, struct xsigo_device, refcnt );
+
+ /* Sanity checks */
+ assert ( ! timer_running ( &xdev->opener ) );
+ assert ( ! timer_running ( &xdev->discovery ) );
+ assert ( xdev->madx == NULL );
+ assert ( list_empty ( &xdev->managers ) );
+
+ /* Drop reference to Infiniband device */
+ ibdev_put ( xdev->ibdev );
+
+ /* Free device */
+ free ( xdev );
+}
+
+/**
+ * Free configuration manager
+ *
+ * @v refcnt Reference count
+ */
+static void xcm_free ( struct refcnt *refcnt ) {
+ struct xsigo_manager *xcm =
+ container_of ( refcnt, struct xsigo_manager, refcnt );
+
+ /* Sanity checks */
+ assert ( ! timer_running ( &xcm->reopen ) );
+ assert ( ! timer_running ( &xcm->keepalive ) );
+ assert ( ! process_running ( &xcm->process ) );
+ assert ( list_empty ( &xcm->nics ) );
+
+ /* Drop reference to Xsigo device */
+ ref_put ( &xcm->xdev->refcnt );
+
+ /* Free manager */
+ free ( xcm );
+}
+
+/****************************************************************************
+ *
+ * Virtual Ethernet (XVE) devices
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Create virtual Ethernet device
+ *
+ * @v xcm Configuration manager
+ * @v resource Resource identifier
+ * @v mac Ethernet MAC
+ * @v network Network identifier
+ * @v name Device name
+ * @ret rc Return status code
+ */
+static int xve_create ( struct xsigo_manager *xcm, union ib_guid *resource,
+ const uint8_t *mac, unsigned long network,
+ unsigned long qkey, const char *name ) {
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ struct xsigo_nic *xve;
+ struct ib_address_vector broadcast;
+ int rc;
+
+ /* Allocate and initialise structure */
+ xve = zalloc ( sizeof ( *xve ) );
+ if ( ! xve ) {
+ rc = -ENOMEM;
+ goto err_alloc;
+ }
+ xve->xcm = xcm;
+ snprintf ( xve->name, sizeof ( xve->name ), "%s", name );
+ memcpy ( &xve->resource, resource, sizeof ( xve->resource ) );
+ memcpy ( xve->mac, mac, ETH_ALEN );
+ xve->network = network;
+ DBGC ( xve, "XVE %s created for %s " IB_GUID_FMT "\n",
+ xve->name, xcm->name, IB_GUID_ARGS ( resource ) );
+ DBGC ( xve, "XVE %s is MAC %s on network %ld\n",
+ xve->name, eth_ntoa ( mac ), network );
+
+ /* Construct broadcast address vector */
+ memset ( &broadcast, 0, sizeof ( broadcast ) );
+ broadcast.qpn = IB_QPN_BROADCAST;
+ broadcast.qkey = qkey;
+ broadcast.gid_present = 1;
+ broadcast.gid.dwords[0] = htonl ( XVE_PREFIX );
+ broadcast.gid.words[2] = htons ( ibdev->pkey );
+ broadcast.gid.dwords[3] = htonl ( network );
+
+ /* Create EoIB device */
+ if ( ( rc = eoib_create ( ibdev, xve->mac, &broadcast,
+ xve->name ) ) != 0 ) {
+ DBGC ( xve, "XVE %s could not create EoIB device: %s\n",
+ xve->name, strerror ( rc ) );
+ goto err_create;
+ }
+
+ /* Add to list of virtual Ethernet devices. Do this only
+ * after creating the EoIB device, so that our net device
+ * notifier won't attempt to send an operational state update
+ * before we have acknowledged the installation.
+ */
+ list_add ( &xve->list, &xcm->nics );
+
+ return 0;
+
+ list_del ( &xve->list );
+ err_create:
+ free ( xve );
+ err_alloc:
+ return rc;
+}
+
+/**
+ * Find virtual Ethernet device
+ *
+ * @v xcm Configuration manager
+ * @v resource Resource identifier
+ * @ret xve Virtual Ethernet device, or NULL
+ */
+static struct xsigo_nic * xve_find ( struct xsigo_manager *xcm,
+ union ib_guid *resource ) {
+ struct xsigo_nic *xve;
+
+ list_for_each_entry ( xve, &xcm->nics, list ) {
+ if ( memcmp ( resource, &xve->resource,
+ sizeof ( *resource ) ) == 0 )
+ return xve;
+ }
+ return NULL;
+}
+
+/**
+ * Destroy virtual Ethernet device
+ *
+ * @v xve Virtual Ethernet device
+ */
+static void xve_destroy ( struct xsigo_nic *xve ) {
+ struct xsigo_manager *xcm = xve->xcm;
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ struct eoib_device *eoib;
+
+ /* Destroy corresponding EoIB device, if any */
+ if ( ( eoib = eoib_find ( ibdev, xve->mac ) ) )
+ eoib_destroy ( eoib );
+
+ /* Remove from list of virtual Ethernet devices */
+ list_del ( &xve->list );
+
+ /* Free virtual Ethernet device */
+ DBGC ( xve, "XVE %s destroyed\n", xve->name );
+ free ( xve );
+}
+
+/**
+ * Update virtual Ethernet device MTU
+ *
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @v mtu New MTU (excluding Ethernet and EoIB headers)
+ * @ret rc Return status code
+ */
+static int xve_update_mtu ( struct xsigo_nic *xve, struct eoib_device *eoib,
+ size_t mtu ) {
+ struct net_device *netdev = eoib->netdev;
+ size_t max;
+
+ /* Check that we can support this MTU */
+ max = ( IB_MAX_PAYLOAD_SIZE - ( sizeof ( struct ethhdr ) +
+ sizeof ( struct eoib_header ) ) );
+ if ( mtu > max ) {
+ DBGC ( xve, "XVE %s cannot support MTU %zd (max %zd)\n",
+ xve->name, mtu, max );
+ return -ERANGE;
+ }
+
+ /* Update MTU. No need to close/reopen the network device,
+ * since our Infiniband stack uses a fixed MTU anyway. Note
+ * that the network device sees the Ethernet frame header but
+ * not the EoIB header.
+ */
+ netdev->max_pkt_len = ( mtu + sizeof ( struct ethhdr ) );
+ DBGC ( xve, "XVE %s has MTU %zd\n", xve->name, mtu );
+
+ return 0;
+}
+
+/**
+ * Open virtual Ethernet device
+ *
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @v open New administrative state
+ * @ret rc Return status code
+ */
+static int xve_open ( struct xsigo_nic *xve, struct eoib_device *eoib ) {
+ struct net_device *netdev = eoib->netdev;
+ int rc;
+
+ /* Do nothing if network device is already open */
+ if ( netdev_is_open ( netdev ) )
+ return 0;
+ DBGC ( xve, "XVE %s opening network device\n", xve->name );
+
+ /* Open network device */
+ if ( ( rc = netdev_open ( netdev ) ) != 0 ) {
+ DBGC ( xve, "XVE %s could not open: %s\n",
+ xve->name, strerror ( rc ) );
+ return rc;
+ }
+
+ return 0;
+}
+
+/**
+ * Close virtual Ethernet device
+ *
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ */
+static void xve_close ( struct xsigo_nic *xve, struct eoib_device *eoib ) {
+ struct net_device *netdev = eoib->netdev;
+
+ /* Do nothing if network device is already closed */
+ if ( ! netdev_is_open ( netdev ) )
+ return;
+
+ /* Close network device */
+ netdev_close ( netdev );
+ DBGC ( xve, "XVE %s closed network device\n", xve->name );
+}
+
+/**
+ * Update virtual Ethernet device administrative state
+ *
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @v open New administrative state
+ * @ret rc Return status code
+ */
+static int xve_update_state ( struct xsigo_nic *xve, struct eoib_device *eoib,
+ int open ) {
+
+ /* Open or close device, as applicable */
+ if ( open ) {
+ return xve_open ( xve, eoib );
+ } else {
+ xve_close ( xve, eoib );
+ return 0;
+ }
+}
+
+/**
+ * Update gateway (TCA)
+ *
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @v av Address vector, or NULL if no gateway
+ * @ret rc Return status code
+ */
+static int xve_update_tca ( struct xsigo_nic *xve, struct eoib_device *eoib,
+ struct ib_address_vector *av ) {
+
+ /* Update gateway address */
+ eoib_set_gateway ( eoib, av );
+ if ( av ) {
+ DBGC ( xve, "XVE %s has TCA " IB_GID_FMT " data %#lx qkey "
+ "%#lx\n", xve->name, IB_GID_ARGS ( &av->gid ), av->qpn,
+ av->qkey );
+ } else {
+ DBGC ( xve, "XVE %s has no TCA\n", xve->name );
+ }
+
+ /* The Linux driver will modify the local device's link state
+ * to reflect the EoIB-to-Ethernet gateway's link state, but
+ * this seems philosophically incorrect since communication
+ * within the EoIB broadcast domain still works regardless of
+ * the state of the gateway.
+ */
+
+ return 0;
+}
+
+/****************************************************************************
+ *
+ * Server management protocol (XSMP) session messages
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Get session message name (for debugging)
+ *
+ * @v type Message type
+ * @ret name Message name
+ */
+static const char * xsmp_session_type ( unsigned int type ) {
+ static char buf[16];
+
+ switch ( type ) {
+ case XSMP_SESSION_TYPE_HELLO: return "HELLO";
+ case XSMP_SESSION_TYPE_REGISTER: return "REGISTER";
+ case XSMP_SESSION_TYPE_CONFIRM: return "CONFIRM";
+ case XSMP_SESSION_TYPE_REJECT: return "REJECT";
+ case XSMP_SESSION_TYPE_SHUTDOWN: return "SHUTDOWN";
+ default:
+ snprintf ( buf, sizeof ( buf ), "UNKNOWN<%d>", type );
+ return buf;
+ }
+}
+
+/**
+ * Extract chassis name (for debugging)
+ *
+ * @v msg Session message
+ * @ret chassis Chassis name
+ */
+static const char * xsmp_chassis_name ( struct xsmp_session_message *msg ) {
+ static char chassis[ sizeof ( msg->chassis ) + 1 /* NUL */ ];
+
+ memcpy ( chassis, msg->chassis, sizeof ( msg->chassis ) );
+ return chassis;
+}
+
+/**
+ * Extract session name (for debugging)
+ *
+ * @v msg Session message
+ * @ret session Session name
+ */
+static const char * xsmp_session_name ( struct xsmp_session_message *msg ) {
+ static char session[ sizeof ( msg->session ) + 1 /* NUL */ ];
+
+ memcpy ( session, msg->session, sizeof ( msg->session ) );
+ return session;
+}
+
+/**
+ * Send session message
+ *
+ * @v xcm Configuration manager
+ * @v type Message type
+ * @ret rc Return status code
+ */
+static int xsmp_tx_session ( struct xsigo_manager *xcm, unsigned int type ) {
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ struct xsmp_session_message msg;
+ int rc;
+
+ /* Construct session message */
+ memset ( &msg, 0, sizeof ( msg ) );
+ msg.hdr.type = XSMP_TYPE_SESSION;
+ msg.hdr.len = htons ( sizeof ( msg ) );
+ msg.hdr.seq = htonl ( ++xcm->seq );
+ memcpy ( &msg.hdr.src.guid, &ibdev->gid.s.guid,
+ sizeof ( msg.hdr.src.guid ) );
+ memcpy ( &msg.hdr.dst.guid, &xcm->id.guid,
+ sizeof ( msg.hdr.dst.guid ) );
+ msg.type = type;
+ msg.len = htons ( sizeof ( msg ) - sizeof ( msg.hdr ) );
+ msg.os_type = XSIGO_OS_TYPE_GENERIC;
+ msg.resources = htons ( XSIGO_RESOURCE_XVE |
+ XSIGO_RESOURCE_NO_HA );
+ msg.boot = htonl ( XSMP_BOOT_PXE );
+ DBGCP ( xcm, "XCM %s TX[%d] session %s\n", xcm->name,
+ ntohl ( msg.hdr.seq ), xsmp_session_type ( msg.type ) );
+ DBGCP_HDA ( xcm, 0, &msg, sizeof ( msg ) );
+
+ /* Send session message */
+ if ( ( rc = xfer_deliver_raw ( &xcm->xfer, &msg,
+ sizeof ( msg ) ) ) != 0 ) {
+ DBGC ( xcm, "XCM %s TX session %s failed: %s\n", xcm->name,
+ xsmp_session_type ( msg.type ), strerror ( rc ) );
+ return rc;
+ }
+
+ return 0;
+}
+
+/**
+ * Send registration message
+ *
+ * @v xcm Configuration manager
+ * @ret rc Return status code
+ */
+static inline int xsmp_tx_session_register ( struct xsigo_manager *xcm ) {
+
+ DBGC ( xcm, "XCM %s registering with " IB_GUID_FMT "\n",
+ xcm->name, IB_GUID_ARGS ( &xcm->id.guid ) );
+
+ /* Send registration message */
+ return xsmp_tx_session ( xcm, XSMP_SESSION_TYPE_REGISTER );
+}
+
+/**
+ * Send keepalive message
+ *
+ * @v xcm Configuration manager
+ * @ret rc Return status code
+ */
+static int xsmp_tx_session_hello ( struct xsigo_manager *xcm ) {
+
+ /* Send keepalive message */
+ return xsmp_tx_session ( xcm, XSMP_SESSION_TYPE_HELLO );
+}
+
+/**
+ * Handle received keepalive message
+ *
+ * @v xcm Configuration manager
+ * @v msg Keepalive message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_session_hello ( struct xsigo_manager *xcm,
+ struct xsmp_session_message *msg __unused ) {
+
+ /* Respond to keepalive message. Note that the XCM doesn't
+ * seem to actually ever send these.
+ */
+ return xsmp_tx_session_hello ( xcm );
+}
+
+/**
+ * Handle received registration confirmation message
+ *
+ * @v xcm Configuration manager
+ * @v msg Registration confirmation message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_session_confirm ( struct xsigo_manager *xcm,
+ struct xsmp_session_message *msg ) {
+
+ DBGC ( xcm, "XCM %s registered with \"%s\" as \"%s\"\n", xcm->name,
+ xsmp_chassis_name ( msg ), xsmp_session_name ( msg ) );
+
+ return 0;
+}
+
+/**
+ * Handle received registration rejection message
+ *
+ * @v xcm Configuration manager
+ * @v msg Registration confirmation message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_session_reject ( struct xsigo_manager *xcm,
+ struct xsmp_session_message *msg ) {
+
+ DBGC ( xcm, "XCM %s rejected by \"%s\":\n",
+ xcm->name, xsmp_chassis_name ( msg ) );
+ DBGC_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+
+ return -EPERM;
+}
+
+/**
+ * Handle received shutdown message
+ *
+ * @v xcm Configuration manager
+ * @v msg Registration confirmation message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_session_shutdown ( struct xsigo_manager *xcm,
+ struct xsmp_session_message *msg ) {
+
+ DBGC ( xcm, "XCM %s shut down by \"%s\":\n",
+ xcm->name, xsmp_chassis_name ( msg ) );
+ DBGC_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+
+ return -ENOTCONN;
+}
+
+/**
+ * Handle received session message
+ *
+ * @v xcm Configuration manager
+ * @v msg Session message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_session ( struct xsigo_manager *xcm,
+ struct xsmp_session_message *msg ) {
+
+ DBGCP ( xcm, "XCM %s RX[%d] session %s\n", xcm->name,
+ ntohl ( msg->hdr.seq ), xsmp_session_type ( msg->type ) );
+ DBGCP_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+
+ /* Handle message according to type */
+ switch ( msg->type ) {
+ case XSMP_SESSION_TYPE_HELLO:
+ return xsmp_rx_session_hello ( xcm, msg );
+ case XSMP_SESSION_TYPE_CONFIRM:
+ return xsmp_rx_session_confirm ( xcm, msg );
+ case XSMP_SESSION_TYPE_REJECT:
+ return xsmp_rx_session_reject ( xcm, msg );
+ case XSMP_SESSION_TYPE_SHUTDOWN:
+ return xsmp_rx_session_shutdown ( xcm, msg );
+ default:
+ DBGC ( xcm, "XCM %s RX[%d] session unexpected %s:\n", xcm->name,
+ ntohl ( msg->hdr.seq ), xsmp_session_type ( msg->type ));
+ DBGC_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+ return -EPROTO;
+ }
+}
+
+/****************************************************************************
+ *
+ * Server management protocol (XSMP) virtual Ethernet (XVE) messages
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Get virtual Ethernet message name (for debugging)
+ *
+ * @v type Message type
+ * @ret name Message name
+ */
+static const char * xsmp_xve_type ( unsigned int type ) {
+ static char buf[16];
+
+ switch ( type ) {
+ case XSMP_XVE_TYPE_INSTALL: return "INSTALL";
+ case XSMP_XVE_TYPE_DELETE: return "DELETE";
+ case XSMP_XVE_TYPE_UPDATE: return "UPDATE";
+ case XSMP_XVE_TYPE_OPER_UP: return "OPER_UP";
+ case XSMP_XVE_TYPE_OPER_DOWN: return "OPER_DOWN";
+ case XSMP_XVE_TYPE_OPER_REQ: return "OPER_REQ";
+ case XSMP_XVE_TYPE_READY: return "READY";
+ default:
+ snprintf ( buf, sizeof ( buf ), "UNKNOWN<%d>", type );
+ return buf;
+ }
+}
+
+/**
+ * Send virtual Ethernet message
+ *
+ * @v xcm Configuration manager
+ * @v msg Partial message
+ * @ret rc Return status code
+ */
+static int xsmp_tx_xve ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ int rc;
+
+ /* Fill in common header fields */
+ msg->hdr.type = XSMP_TYPE_XVE;
+ msg->hdr.len = htons ( sizeof ( *msg ) );
+ msg->hdr.seq = htonl ( ++xcm->seq );
+ memcpy ( &msg->hdr.src.guid, &ibdev->gid.s.guid,
+ sizeof ( msg->hdr.src.guid ) );
+ memcpy ( &msg->hdr.dst.guid, &xcm->id.guid,
+ sizeof ( msg->hdr.dst.guid ) );
+ msg->len = htons ( sizeof ( *msg ) - sizeof ( msg->hdr ) );
+ DBGCP ( xcm, "XCM %s TX[%d] xve %s code %#02x\n", xcm->name,
+ ntohl ( msg->hdr.seq ), xsmp_xve_type ( msg->type ),
+ msg->code );
+ DBGCP_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+
+ /* Send virtual Ethernet message */
+ if ( ( rc = xfer_deliver_raw ( &xcm->xfer, msg,
+ sizeof ( *msg ) ) ) != 0 ) {
+ DBGC ( xcm, "XCM %s TX xve %s failed: %s\n", xcm->name,
+ xsmp_xve_type ( msg->type ), strerror ( rc ) );
+ return rc;
+ }
+
+ return 0;
+}
+
+/**
+ * Send virtual Ethernet message including current device parameters
+ *
+ * @v xcm Configuration manager
+ * @v msg Partial virtual Ethernet message
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @ret rc Return status code
+ */
+static int xsmp_tx_xve_params ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg,
+ struct xsigo_nic *xve,
+ struct eoib_device *eoib ) {
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ struct net_device *netdev = eoib->netdev;
+
+ /* Set successful response code */
+ msg->code = 0;
+
+ /* Include network identifier, MTU, and current HCA parameters */
+ msg->network = htonl ( xve->network );
+ msg->mtu = htons ( netdev->max_pkt_len - sizeof ( struct ethhdr ) );
+ msg->hca.prefix_le.qword = bswap_64 ( ibdev->gid.s.prefix.qword );
+ msg->hca.pkey = htons ( ibdev->pkey );
+ msg->hca.qkey = msg->tca.qkey;
+ if ( eoib->qp ) {
+ msg->hca.data = htonl ( eoib->qp->ext_qpn );
+ msg->hca.qkey = htons ( eoib->qp->qkey );
+ }
+
+ /* The message type field is (ab)used to return the current
+ * operational status.
+ */
+ if ( msg->type == XSMP_XVE_TYPE_OPER_REQ ) {
+ msg->type = ( netdev_is_open ( netdev ) ?
+ XSMP_XVE_TYPE_OPER_UP : XSMP_XVE_TYPE_OPER_DOWN );
+ }
+
+ /* Send message */
+ DBGC ( xve, "XVE %s network %d MTU %d ctrl %#x data %#x qkey %#04x "
+ "%s\n", xve->name, ntohl ( msg->network ), ntohs ( msg->mtu ),
+ ntohl ( msg->hca.ctrl ), ntohl ( msg->hca.data ),
+ ntohs ( msg->hca.qkey ), xsmp_xve_type ( msg->type ) );
+
+ return xsmp_tx_xve ( xcm, msg );
+}
+
+/**
+ * Send virtual Ethernet error response
+ *
+ * @v xcm Configuration manager
+ * @v msg Partial virtual Ethernet message
+ * @ret rc Return status code
+ */
+static inline int xsmp_tx_xve_nack ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+
+ /* Set error response code. (There aren't any meaningful
+ * detailed response codes defined by the wire protocol.)
+ */
+ msg->code = XSMP_XVE_CODE_ERROR;
+
+ /* Send message */
+ return xsmp_tx_xve ( xcm, msg );
+}
+
+/**
+ * Send virtual Ethernet notification
+ *
+ * @v xcm Configuration manager
+ * @v type Message type
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @ret rc Return status code
+ */
+static int xsmp_tx_xve_notify ( struct xsigo_manager *xcm,
+ unsigned int type,
+ struct xsigo_nic *xve,
+ struct eoib_device *eoib ) {
+ struct xsmp_xve_message msg;
+
+ /* Construct message */
+ memset ( &msg, 0, sizeof ( msg ) );
+ msg.type = type;
+ memcpy ( &msg.resource, &xve->resource, sizeof ( msg.resource ) );
+
+ /* Send message */
+ return xsmp_tx_xve_params ( xcm, &msg, xve, eoib );
+}
+
+/**
+ * Send virtual Ethernet current operational state
+ *
+ * @v xcm Configuration manager
+ * @v xve Virtual Ethernet device
+ * @v eoib EoIB device
+ * @ret rc Return status code
+ */
+static inline int xsmp_tx_xve_oper ( struct xsigo_manager *xcm,
+ struct xsigo_nic *xve,
+ struct eoib_device *eoib ) {
+
+ /* Send notification */
+ return xsmp_tx_xve_notify ( xcm, XSMP_XVE_TYPE_OPER_REQ, xve, eoib );
+}
+
+/**
+ * Handle received virtual Ethernet modification message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @v update Update bitmask
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_modify ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg,
+ unsigned int update ) {
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ struct xsigo_nic *xve;
+ struct eoib_device *eoib;
+ struct ib_address_vector tca;
+ size_t mtu;
+ int rc;
+
+ /* Avoid returning uninitialised HCA parameters in response */
+ memset ( &msg->hca, 0, sizeof ( msg->hca ) );
+
+ /* Find virtual Ethernet device */
+ xve = xve_find ( xcm, &msg->resource );
+ if ( ! xve ) {
+ DBGC ( xcm, "XCM %s unrecognised resource " IB_GUID_FMT "\n",
+ xcm->name, IB_GUID_ARGS ( &msg->resource ) );
+ rc = -ENOENT;
+ goto err_no_xve;
+ }
+
+ /* Find corresponding EoIB device */
+ eoib = eoib_find ( ibdev, xve->mac );
+ if ( ! eoib ) {
+ DBGC ( xve, "XVE %s has no EoIB device\n", xve->name );
+ rc = -EPIPE;
+ goto err_no_eoib;
+ }
+
+ /* The Xsigo management software fails to create the EoIB
+ * multicast group. This is a fundamental design flaw.
+ */
+ eoib_force_group_creation ( eoib );
+
+ /* Extract modifiable parameters. Note that the TCA GID is
+ * erroneously transmitted as little-endian.
+ */
+ mtu = ntohs ( msg->mtu );
+ tca.qpn = ntohl ( msg->tca.data );
+ tca.qkey = ntohs ( msg->tca.qkey );
+ tca.gid_present = 1;
+ tca.gid.s.prefix.qword = bswap_64 ( msg->tca.prefix_le.qword );
+ tca.gid.s.guid.qword = bswap_64 ( msg->guid_le.qword );
+
+ /* Update MTU, if applicable */
+ if ( ( update & XSMP_XVE_UPDATE_MTU ) &&
+ ( ( rc = xve_update_mtu ( xve, eoib, mtu ) ) != 0 ) )
+ goto err_mtu;
+ update &= ~XSMP_XVE_UPDATE_MTU;
+
+ /* Update admin state, if applicable */
+ if ( ( update & XSMP_XVE_UPDATE_STATE ) &&
+ ( ( rc = xve_update_state ( xve, eoib, msg->state ) ) != 0 ) )
+ goto err_state;
+ update &= ~XSMP_XVE_UPDATE_STATE;
+
+ /* Remove gateway, if applicable */
+ if ( ( update & XSMP_XVE_UPDATE_GW_DOWN ) &&
+ ( ( rc = xve_update_tca ( xve, eoib, NULL ) ) != 0 ) )
+ goto err_gw_down;
+ update &= ~XSMP_XVE_UPDATE_GW_DOWN;
+
+ /* Update gateway, if applicable */
+ if ( ( update & XSMP_XVE_UPDATE_GW_CHANGE ) &&
+ ( ( rc = xve_update_tca ( xve, eoib, &tca ) ) != 0 ) )
+ goto err_gw_change;
+ update &= ~XSMP_XVE_UPDATE_GW_CHANGE;
+
+ /* Warn about unexpected updates */
+ if ( update ) {
+ DBGC ( xve, "XVE %s unrecognised update(s) %#08x\n",
+ xve->name, update );
+ }
+
+ xsmp_tx_xve_params ( xcm, msg, xve, eoib );
+ return 0;
+
+ err_gw_change:
+ err_gw_down:
+ err_state:
+ err_mtu:
+ err_no_eoib:
+ err_no_xve:
+ /* Send NACK */
+ xsmp_tx_xve_nack ( xcm, msg );
+ return rc;
+}
+
+/**
+ * Handle received virtual Ethernet installation message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_install ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+ union {
+ struct xsmp_xve_mac msg;
+ uint8_t raw[ETH_ALEN];
+ } mac;
+ char name[ sizeof ( msg->name ) + 1 /* NUL */ ];
+ unsigned long network;
+ unsigned long qkey;
+ unsigned int update;
+ int rc;
+
+ /* Demangle MAC address (which is erroneously transmitted as
+ * little-endian).
+ */
+ mac.msg.high = bswap_16 ( msg->mac_le.high );
+ mac.msg.low = bswap_32 ( msg->mac_le.low );
+
+ /* Extract interface name (which may not be NUL-terminated) */
+ memcpy ( name, msg->name, ( sizeof ( name ) - 1 /* NUL */ ) );
+ name[ sizeof ( name ) - 1 /* NUL */ ] = '\0';
+
+ /* Extract remaining message parameters */
+ network = ntohl ( msg->network );
+ qkey = ntohs ( msg->tca.qkey );
+ DBGC2 ( xcm, "XCM %s " IB_GUID_FMT " install \"%s\" %s net %ld qkey "
+ "%#lx\n", xcm->name, IB_GUID_ARGS ( &msg->resource ), name,
+ eth_ntoa ( mac.raw ), network, qkey );
+
+ /* Create virtual Ethernet device, if applicable */
+ if ( ( xve_find ( xcm, &msg->resource ) == NULL ) &&
+ ( ( rc = xve_create ( xcm, &msg->resource, mac.raw, network,
+ qkey, name ) ) != 0 ) )
+ goto err_create;
+
+ /* Handle remaining parameters as for a modification message */
+ update = XSMP_XVE_UPDATE_MTU;
+ if ( msg->uplink == XSMP_XVE_UPLINK )
+ update |= XSMP_XVE_UPDATE_GW_CHANGE;
+ return xsmp_rx_xve_modify ( xcm, msg, update );
+
+ err_create:
+ /* Send NACK */
+ xsmp_tx_xve_nack ( xcm, msg );
+ return rc;
+}
+
+/**
+ * Handle received virtual Ethernet deletion message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_delete ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+ struct xsigo_nic *xve;
+
+ DBGC2 ( xcm, "XCM %s " IB_GUID_FMT " delete\n",
+ xcm->name, IB_GUID_ARGS ( &msg->resource ) );
+
+ /* Destroy virtual Ethernet device (if any) */
+ if ( ( xve = xve_find ( xcm, &msg->resource ) ) )
+ xve_destroy ( xve );
+
+ /* Send ACK */
+ msg->code = 0;
+ xsmp_tx_xve ( xcm, msg );
+
+ return 0;
+}
+
+/**
+ * Handle received virtual Ethernet update message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_update ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+ unsigned int update = ntohl ( msg->update );
+
+ DBGC2 ( xcm, "XCM %s " IB_GUID_FMT " update (%08x)\n",
+ xcm->name, IB_GUID_ARGS ( &msg->resource ), update );
+
+ /* Handle as a modification message */
+ return xsmp_rx_xve_modify ( xcm, msg, update );
+}
+
+/**
+ * Handle received virtual Ethernet operational request message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_oper_req ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+
+ DBGC2 ( xcm, "XCM %s " IB_GUID_FMT " operational request\n",
+ xcm->name, IB_GUID_ARGS ( &msg->resource ) );
+
+ /* Handle as a nullipotent modification message */
+ return xsmp_rx_xve_modify ( xcm, msg, 0 );
+}
+
+/**
+ * Handle received virtual Ethernet readiness message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve_ready ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+ int rc;
+
+ DBGC2 ( xcm, "XCM %s " IB_GUID_FMT " ready\n",
+ xcm->name, IB_GUID_ARGS ( &msg->resource ) );
+
+ /* Handle as a nullipotent modification message */
+ if ( ( rc = xsmp_rx_xve_modify ( xcm, msg, 0 ) ) != 0 )
+ return rc;
+
+ /* Send an unsolicited operational state update, since there
+ * is no other way to convey the current operational state.
+ */
+ msg->type = XSMP_XVE_TYPE_OPER_REQ;
+ if ( ( rc = xsmp_rx_xve_modify ( xcm, msg, 0 ) ) != 0 )
+ return rc;
+
+ return 0;
+}
+
+/**
+ * Handle received virtual Ethernet message
+ *
+ * @v xcm Configuration manager
+ * @v msg Virtual Ethernet message
+ * @ret rc Return status code
+ */
+static int xsmp_rx_xve ( struct xsigo_manager *xcm,
+ struct xsmp_xve_message *msg ) {
+
+ DBGCP ( xcm, "XCM %s RX[%d] xve %s\n", xcm->name,
+ ntohl ( msg->hdr.seq ), xsmp_xve_type ( msg->type ) );
+ DBGCP_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+
+ /* Handle message according to type */
+ switch ( msg->type ) {
+ case XSMP_XVE_TYPE_INSTALL:
+ return xsmp_rx_xve_install ( xcm, msg );
+ case XSMP_XVE_TYPE_DELETE:
+ return xsmp_rx_xve_delete ( xcm, msg );
+ case XSMP_XVE_TYPE_UPDATE:
+ return xsmp_rx_xve_update ( xcm, msg );
+ case XSMP_XVE_TYPE_OPER_REQ:
+ return xsmp_rx_xve_oper_req ( xcm, msg );
+ case XSMP_XVE_TYPE_READY:
+ return xsmp_rx_xve_ready ( xcm, msg );
+ default:
+ DBGC ( xcm, "XCM %s RX[%d] xve unexpected %s:\n", xcm->name,
+ ntohl ( msg->hdr.seq ), xsmp_xve_type ( msg->type ) );
+ DBGC_HDA ( xcm, 0, msg, sizeof ( *msg ) );
+ return -EPROTO;
+ }
+}
+
+/****************************************************************************
+ *
+ * Configuration managers (XCM)
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Close configuration manager connection
+ *
+ * @v xcm Configuration manager
+ * @v rc Reason for close
+ */
+static void xcm_close ( struct xsigo_manager *xcm, int rc ) {
+
+ DBGC ( xcm, "XCM %s closed: %s\n", xcm->name, strerror ( rc ) );
+
+ /* Stop transmission process */
+ process_del ( &xcm->process );
+
+ /* Stop keepalive timer */
+ stop_timer ( &xcm->keepalive );
+
+ /* Restart data transfer interface */
+ intf_restart ( &xcm->xfer, rc );
+
+ /* Schedule reconnection attempt */
+ start_timer ( &xcm->reopen );
+}
+
+/**
+ * Send data to configuration manager
+ *
+ * @v xcm Configuration manager
+ */
+static void xcm_step ( struct xsigo_manager *xcm ) {
+ int rc;
+
+ /* Do nothing unless we have something to send */
+ if ( ! xcm->pending )
+ return;
+
+ /* Send (empty) connection request, if applicable */
+ if ( xcm->pending & XCM_TX_CONNECT ) {
+ if ( ( rc = xfer_deliver_raw ( &xcm->xfer, NULL, 0 ) ) != 0 ) {
+ DBGC ( xcm, "XCM %s could not send connection request: "
+ "%s\n", xcm->name, strerror ( rc ) );
+ goto err;
+ }
+ xcm->pending &= ~XCM_TX_CONNECT;
+ return;
+ }
+
+ /* Wait until data transfer interface is connected */
+ if ( ! xfer_window ( &xcm->xfer ) )
+ return;
+
+ /* Send registration message, if applicable */
+ if ( xcm->pending & XCM_TX_REGISTER ) {
+ if ( ( rc = xsmp_tx_session_register ( xcm ) ) != 0 )
+ goto err;
+ xcm->pending &= ~XCM_TX_REGISTER;
+ return;
+ }
+
+ return;
+
+ err:
+ xcm_close ( xcm, rc );
+}
+
+/**
+ * Receive data from configuration manager
+ *
+ * @v xcm Configuration manager
+ * @v iobuf I/O buffer
+ * @v meta Data transfer metadata
+ * @ret rc Return status code
+ */
+static int xcm_deliver ( struct xsigo_manager *xcm, struct io_buffer *iobuf,
+ struct xfer_metadata *meta __unused ) {
+ union xsmp_message *msg;
+ size_t len = iob_len ( iobuf );
+ int rc;
+
+ /* Sanity check */
+ if ( len < sizeof ( msg->hdr ) ) {
+ DBGC ( xcm, "XCM %s underlength message:\n", xcm->name );
+ DBGC_HDA ( xcm, 0, iobuf->data, iob_len ( iobuf ) );
+ rc = -EPROTO;
+ goto out;
+ }
+ msg = iobuf->data;
+
+ /* Handle message according to type */
+ if ( ! msg->hdr.type ) {
+
+ /* Ignore unused communication manager private data blocks */
+ rc = 0;
+
+ } else if ( ( msg->hdr.type == XSMP_TYPE_SESSION ) &&
+ ( len >= sizeof ( msg->sess ) ) ) {
+
+ /* Session message */
+ rc = xsmp_rx_session ( xcm, &msg->sess );
+
+ } else if ( ( msg->hdr.type == XSMP_TYPE_XVE ) &&
+ ( len >= sizeof ( msg->xve ) ) ) {
+
+ /* Virtual Ethernet message */
+ xsmp_rx_xve ( xcm, &msg->xve );
+
+ /* Virtual Ethernet message errors are non-fatal */
+ rc = 0;
+
+ } else {
+
+ /* Unknown message */
+ DBGC ( xcm, "XCM %s unexpected message type %d:\n",
+ xcm->name, msg->hdr.type );
+ DBGC_HDA ( xcm, 0, iobuf->data, iob_len ( iobuf ) );
+ rc = -EPROTO;
+ }
+
+ out:
+ free_iob ( iobuf );
+ if ( rc != 0 )
+ xcm_close ( xcm, rc );
+ return rc;
+}
+
+/** Configuration manager data transfer interface operations */
+static struct interface_operation xcm_xfer_op[] = {
+ INTF_OP ( xfer_deliver, struct xsigo_manager *, xcm_deliver ),
+ INTF_OP ( xfer_window_changed, struct xsigo_manager *, xcm_step ),
+ INTF_OP ( intf_close, struct xsigo_manager *, xcm_close ),
+};
+
+/** Configuration manager data transfer interface descriptor */
+static struct interface_descriptor xcm_xfer_desc =
+ INTF_DESC ( struct xsigo_manager, xfer, xcm_xfer_op );
+
+/** Configuration manager process descriptor */
+static struct process_descriptor xcm_process_desc =
+ PROC_DESC_ONCE ( struct xsigo_manager, process, xcm_step );
+
+/**
+ * Handle configuration manager connection timer expiry
+ *
+ * @v timer Connection timer
+ * @v fail Failure indicator
+ */
+static void xcm_reopen ( struct retry_timer *timer, int fail __unused ) {
+ struct xsigo_manager *xcm =
+ container_of ( timer, struct xsigo_manager, reopen );
+ struct xsigo_device *xdev = xcm->xdev;
+ struct ib_device *ibdev = xdev->ibdev;
+ union ib_gid gid;
+ int rc;
+
+ /* Stop transmission process */
+ process_del ( &xcm->process );
+
+ /* Stop keepalive timer */
+ stop_timer ( &xcm->keepalive );
+
+ /* Restart data transfer interface */
+ intf_restart ( &xcm->xfer, -ECANCELED );
+
+ /* Reset sequence number */
+ xcm->seq = 0;
+
+ /* Construct GID */
+ memcpy ( &gid.s.prefix, &ibdev->gid.s.prefix, sizeof ( gid.s.prefix ) );
+ memcpy ( &gid.s.guid, &xcm->id.guid, sizeof ( gid.s.guid ) );
+ DBGC ( xcm, "XCM %s connecting to " IB_GID_FMT "\n",
+ xcm->name, IB_GID_ARGS ( &gid ) );
+
+ /* Open CMRC connection */
+ if ( ( rc = ib_cmrc_open ( &xcm->xfer, ibdev, &gid,
+ &xcm_service_id, xcm->name ) ) != 0 ) {
+ DBGC ( xcm, "XCM %s could not open CMRC connection: %s\n",
+ xcm->name, strerror ( rc ) );
+ start_timer ( &xcm->reopen );
+ return;
+ }
+
+ /* Schedule transmissions */
+ xcm->pending |= ( XCM_TX_CONNECT | XCM_TX_REGISTER );
+ process_add ( &xcm->process );
+
+ /* Start keepalive timer */
+ start_timer_fixed ( &xcm->keepalive, XSIGO_KEEPALIVE_INTERVAL );
+
+ return;
+}
+
+/**
+ * Handle configuration manager keepalive timer expiry
+ *
+ * @v timer Connection timer
+ * @v fail Failure indicator
+ */
+static void xcm_keepalive ( struct retry_timer *timer, int fail __unused ) {
+ struct xsigo_manager *xcm =
+ container_of ( timer, struct xsigo_manager, keepalive );
+ int rc;
+
+ /* Send keepalive message. The server won't actually respond
+ * to these, but it gives the RC queue pair a chance to
+ * complain if it doesn't ever at least get an ACK.
+ */
+ if ( ( rc = xsmp_tx_session_hello ( xcm ) ) != 0 ) {
+ xcm_close ( xcm, rc );
+ return;
+ }
+
+ /* Restart keepalive timer */
+ start_timer_fixed ( &xcm->keepalive, XSIGO_KEEPALIVE_INTERVAL );
+}
+
+/**
+ * Create configuration manager
+ *
+ * @v xsigo Xsigo device
+ * @v id Configuration manager ID
+ * @ret rc Return status code
+ */
+static int xcm_create ( struct xsigo_device *xdev,
+ struct xsigo_manager_id *id ) {
+ struct xsigo_manager *xcm;
+
+ /* Allocate and initialise structure */
+ xcm = zalloc ( sizeof ( *xcm ) );
+ if ( ! xcm )
+ return -ENOMEM;
+ ref_init ( &xcm->refcnt, xcm_free );
+ xcm->xdev = xdev;
+ ref_get ( &xcm->xdev->refcnt );
+ snprintf ( xcm->name, sizeof ( xcm->name ), "%s:xcm-%d",
+ xdev->name, ntohs ( id->lid ) );
+ memcpy ( &xcm->id, id, sizeof ( xcm->id ) );
+ intf_init ( &xcm->xfer, &xcm_xfer_desc, &xcm->refcnt );
+ timer_init ( &xcm->keepalive, xcm_keepalive, &xcm->refcnt );
+ timer_init ( &xcm->reopen, xcm_reopen, &xcm->refcnt );
+ process_init_stopped ( &xcm->process, &xcm_process_desc, &xcm->refcnt );
+ INIT_LIST_HEAD ( &xcm->nics );
+
+ /* Start timer to open connection */
+ start_timer_nodelay ( &xcm->reopen );
+
+ /* Add to list of managers and transfer reference to list */
+ list_add ( &xcm->list, &xdev->managers );
+ DBGC ( xcm, "XCM %s created for " IB_GUID_FMT " (LID %d)\n", xcm->name,
+ IB_GUID_ARGS ( &xcm->id.guid ), ntohs ( id->lid ) );
+ return 0;
+}
+
+/**
+ * Find configuration manager
+ *
+ * @v xsigo Xsigo device
+ * @v id Configuration manager ID
+ * @ret xcm Configuration manager, or NULL
+ */
+static struct xsigo_manager * xcm_find ( struct xsigo_device *xdev,
+ struct xsigo_manager_id *id ) {
+ struct xsigo_manager *xcm;
+ union ib_guid *guid = &id->guid;
+
+ /* Find configuration manager */
+ list_for_each_entry ( xcm, &xdev->managers, list ) {
+ if ( memcmp ( guid, &xcm->id.guid, sizeof ( *guid ) ) == 0 )
+ return xcm;
+ }
+ return NULL;
+}
+
+/**
+ * Destroy configuration manager
+ *
+ * @v xcm Configuration manager
+ */
+static void xcm_destroy ( struct xsigo_manager *xcm ) {
+ struct xsigo_nic *xve;
+
+ /* Remove all EoIB NICs */
+ while ( ( xve = list_first_entry ( &xcm->nics, struct xsigo_nic,
+ list ) ) ) {
+ xve_destroy ( xve );
+ }
+
+ /* Stop transmission process */
+ process_del ( &xcm->process );
+
+ /* Stop timers */
+ stop_timer ( &xcm->keepalive );
+ stop_timer ( &xcm->reopen );
+
+ /* Shut down data transfer interface */
+ intf_shutdown ( &xcm->xfer, 0 );
+
+ /* Remove from list of managers and drop list's reference */
+ DBGC ( xcm, "XCM %s destroyed\n", xcm->name );
+ list_del ( &xcm->list );
+ ref_put ( &xcm->refcnt );
+}
+
+/**
+ * Synchronise list of configuration managers
+ *
+ * @v xdev Xsigo device
+ * @v ids List of manager IDs
+ * @v count Number of manager IDs
+ * @ret rc Return status code
+ */
+static int xcm_list ( struct xsigo_device *xdev, struct xsigo_manager_id *ids,
+ unsigned int count ) {
+ struct xsigo_manager_id *id;
+ struct xsigo_manager *xcm;
+ struct xsigo_manager *tmp;
+ struct list_head list;
+ unsigned int i;
+ int rc;
+
+ /* Create list of managers to be retained */
+ INIT_LIST_HEAD ( &list );
+ for ( i = 0, id = ids ; i < count ; i++, id++ ) {
+ if ( ( xcm = xcm_find ( xdev, id ) ) ) {
+ list_del ( &xcm->list );
+ list_add_tail ( &xcm->list, &list );
+ }
+ }
+
+ /* Destroy any managers not in the list */
+ list_for_each_entry_safe ( xcm, tmp, &xdev->managers, list )
+ xcm_destroy ( xcm );
+ list_splice ( &list, &xdev->managers );
+
+ /* Create any new managers in the list, and force reconnection
+ * for any changed LIDs.
+ */
+ for ( i = 0, id = ids ; i < count ; i++, id++ ) {
+ if ( ( xcm = xcm_find ( xdev, id ) ) ) {
+ if ( xcm->id.lid != id->lid )
+ start_timer_nodelay ( &xcm->reopen );
+ continue;
+ }
+ if ( ( rc = xcm_create ( xdev, id ) ) != 0 ) {
+ DBGC ( xdev, "XDEV %s could not create manager: %s\n",
+ xdev->name, strerror ( rc ) );
+ return rc;
+ }
+ }
+
+ return 0;
+}
+
+/****************************************************************************
+ *
+ * Configuration manager discovery
+ *
+ ****************************************************************************
+ */
+
+/** A stage of discovery */
+struct xsigo_discovery {
+ /** Name */
+ const char *name;
+ /** Management transaction operations */
+ struct ib_mad_transaction_operations op;
+};
+
+/**
+ * Handle configuration manager lookup completion
+ *
+ * @v ibdev Infiniband device
+ * @v mi Management interface
+ * @v madx Management transaction
+ * @v rc Status code
+ * @v mad Received MAD (or NULL on error)
+ * @v av Source address vector (or NULL on error)
+ */
+static void xsigo_xcm_complete ( struct ib_device *ibdev,
+ struct ib_mad_interface *mi __unused,
+ struct ib_mad_transaction *madx,
+ int rc, union ib_mad *mad,
+ struct ib_address_vector *av __unused ) {
+ struct xsigo_device *xdev = ib_madx_get_ownerdata ( madx );
+ union xsigo_mad *xsmad = container_of ( mad, union xsigo_mad, mad );
+ struct xsigo_managers_reply *reply = &xsmad->reply;
+
+ /* Check for failures */
+ if ( ( rc == 0 ) && ( mad->hdr.status != htons ( IB_MGMT_STATUS_OK ) ) )
+ rc = -ENODEV;
+ if ( rc != 0 ) {
+ DBGC ( xdev, "XDEV %s manager lookup failed: %s\n",
+ xdev->name, strerror ( rc ) );
+ goto out;
+ }
+
+ /* Sanity checks */
+ if ( reply->count > ( sizeof ( reply->manager ) /
+ sizeof ( reply->manager[0] ) ) ) {
+ DBGC ( xdev, "XDEV %s has too many managers (%d)\n",
+ xdev->name, reply->count );
+ goto out;
+ }
+
+ /* Synchronise list of managers */
+ if ( ( rc = xcm_list ( xdev, reply->manager, reply->count ) ) != 0 )
+ goto out;
+
+ /* Report an empty list of managers */
+ if ( reply->count == 0 )
+ DBGC ( xdev, "XDEV %s has no managers\n", xdev->name );
+
+ /* Delay next discovery attempt */
+ start_timer_fixed ( &xdev->discovery, XSIGO_DISCOVERY_SUCCESS_DELAY );
+
+out:
+ /* Destroy the completed transaction */
+ ib_destroy_madx ( ibdev, ibdev->gsi, madx );
+ xdev->madx = NULL;
+}
+
+/** Configuration manager lookup discovery stage */
+static struct xsigo_discovery xsigo_xcm_discovery = {
+ .name = "manager",
+ .op = {
+ .complete = xsigo_xcm_complete,
+ },
+};
+
+/**
+ * Handle directory service lookup completion
+ *
+ * @v ibdev Infiniband device
+ * @v mi Management interface
+ * @v madx Management transaction
+ * @v rc Status code
+ * @v mad Received MAD (or NULL on error)
+ * @v av Source address vector (or NULL on error)
+ */
+static void xsigo_xds_complete ( struct ib_device *ibdev,
+ struct ib_mad_interface *mi __unused,
+ struct ib_mad_transaction *madx,
+ int rc, union ib_mad *mad,
+ struct ib_address_vector *av __unused ) {
+ struct xsigo_device *xdev = ib_madx_get_ownerdata ( madx );
+ union xsigo_mad *xsmad = container_of ( mad, union xsigo_mad, mad );
+ struct xsigo_managers_request *request = &xsmad->request;
+ struct ib_service_record *svc;
+ struct ib_address_vector dest;
+ union ib_guid *guid;
+
+ /* Allow for reuse of transaction pointer */
+ xdev->madx = NULL;
+
+ /* Check for failures */
+ if ( ( rc == 0 ) && ( mad->hdr.status != htons ( IB_MGMT_STATUS_OK ) ) )
+ rc = -ENODEV;
+ if ( rc != 0 ) {
+ DBGC ( xdev, "XDEV %s directory lookup failed: %s\n",
+ xdev->name, strerror ( rc ) );
+ goto out;
+ }
+
+ /* Construct address vector */
+ memset ( &dest, 0, sizeof ( dest ) );
+ svc = &mad->sa.sa_data.service_record;
+ dest.lid = ntohs ( svc->data16[0] );
+ dest.sl = ibdev->sm_sl;
+ dest.qpn = IB_QPN_GSI;
+ dest.qkey = IB_QKEY_GSI;
+ guid = ( ( union ib_guid * ) &svc->data64[0] );
+ DBGC2 ( xdev, "XDEV %s found directory at LID %d GUID " IB_GUID_FMT
+ "\n", xdev->name, dest.lid, IB_GUID_ARGS ( guid ) );
+
+ /* Construct request (reusing MAD buffer) */
+ memset ( request, 0, sizeof ( *request ) );
+ request->mad_hdr.mgmt_class = XSIGO_MGMT_CLASS;
+ request->mad_hdr.class_version = XSIGO_MGMT_CLASS_VERSION;
+ request->mad_hdr.method = IB_MGMT_METHOD_GET;
+ request->mad_hdr.attr_id = htons ( XSIGO_ATTR_XCM_REQUEST );
+ memcpy ( &request->server.guid, &ibdev->gid.s.guid,
+ sizeof ( request->server.guid ) );
+ snprintf ( request->os_version, sizeof ( request->os_version ),
+ "%s %s", product_short_name, product_version );
+ snprintf ( request->arch, sizeof ( request->arch ), _S2 ( ARCH ) );
+ request->os_type = XSIGO_OS_TYPE_GENERIC;
+ request->resources = htons ( XSIGO_RESOURCES_PRESENT |
+ XSIGO_RESOURCE_XVE |
+ XSIGO_RESOURCE_NO_HA );
+
+ /* The handling of this request on the server side is a
+ * textbook example of how not to design a wire protocol. The
+ * server uses the _driver_ version number to determine which
+ * fields are present.
+ */
+ request->driver_version = htonl ( 0x2a2a2a );
+
+ /* The build version field is ignored unless it happens to
+ * contain the substring "xg-".
+ */
+ snprintf ( request->build, sizeof ( request->build ),
+ "not-xg-%08lx", build_id );
+
+ /* The server side user interface occasionally has no way to
+ * refer to an entry with an empty hostname.
+ */
+ fetch_string_setting ( NULL, &hostname_setting, request->hostname,
+ sizeof ( request->hostname ) );
+ if ( ! request->hostname[0] ) {
+ snprintf ( request->hostname, sizeof ( request->hostname ),
+ "%s-" IB_GUID_FMT, product_short_name,
+ IB_GUID_ARGS ( &ibdev->gid.s.guid ) );
+ }
+
+ /* Start configuration manager lookup */
+ xdev->madx = ib_create_madx ( ibdev, ibdev->gsi, mad, &dest,
+ &xsigo_xcm_discovery.op );
+ if ( ! xdev->madx ) {
+ DBGC ( xdev, "XDEV %s could not start manager lookup\n",
+ xdev->name );
+ goto out;
+ }
+ ib_madx_set_ownerdata ( xdev->madx, xdev );
+
+out:
+ /* Destroy the completed transaction */
+ ib_destroy_madx ( ibdev, ibdev->gsi, madx );
+}
+
+/** Directory service lookup discovery stage */
+static struct xsigo_discovery xsigo_xds_discovery = {
+ .name = "directory",
+ .op = {
+ .complete = xsigo_xds_complete,
+ },
+};
+
+/**
+ * Discover configuration managers
+ *
+ * @v timer Retry timer
+ * @v over Failure indicator
+ */
+static void xsigo_discover ( struct retry_timer *timer, int over __unused ) {
+ struct xsigo_device *xdev =
+ container_of ( timer, struct xsigo_device, discovery );
+ struct ib_device *ibdev = xdev->ibdev;
+ struct xsigo_discovery *discovery;
+
+ /* Restart timer */
+ start_timer_fixed ( &xdev->discovery, XSIGO_DISCOVERY_FAILURE_DELAY );
+
+ /* Cancel any pending discovery transaction */
+ if ( xdev->madx ) {
+ discovery = container_of ( xdev->madx->op,
+ struct xsigo_discovery, op );
+ DBGC ( xdev, "XDEV %s timed out waiting for %s lookup\n",
+ xdev->name, discovery->name );
+ ib_destroy_madx ( ibdev, ibdev->gsi, xdev->madx );
+ xdev->madx = NULL;
+ }
+
+ /* Start directory service lookup */
+ xdev->madx = ib_create_service_madx ( ibdev, ibdev->gsi,
+ XDS_SERVICE_NAME,
+ &xsigo_xds_discovery.op );
+ if ( ! xdev->madx ) {
+ DBGC ( xdev, "XDEV %s could not start directory lookup\n",
+ xdev->name );
+ return;
+ }
+ ib_madx_set_ownerdata ( xdev->madx, xdev );
+}
+
+/****************************************************************************
+ *
+ * Infiniband device driver
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Open link and start discovery
+ *
+ * @v opener Link opener
+ * @v over Failure indicator
+ */
+static void xsigo_ib_open ( struct retry_timer *opener, int over __unused ) {
+ struct xsigo_device *xdev =
+ container_of ( opener, struct xsigo_device, opener );
+ struct ib_device *ibdev = xdev->ibdev;
+ int rc;
+
+ /* Open Infiniband device */
+ if ( ( rc = ib_open ( ibdev ) ) != 0 ) {
+ DBGC ( xdev, "XDEV %s could not open: %s\n",
+ xdev->name, strerror ( rc ) );
+ /* Delay and try again */
+ start_timer_fixed ( &xdev->opener, XSIGO_OPEN_RETRY_DELAY );
+ return;
+ }
+
+ /* If link is already up, then start discovery */
+ if ( ib_link_ok ( ibdev ) )
+ start_timer_nodelay ( &xdev->discovery );
+}
+
+/**
+ * Probe Xsigo device
+ *
+ * @v ibdev Infiniband device
+ * @ret rc Return status code
+ */
+static int xsigo_ib_probe ( struct ib_device *ibdev ) {
+ struct xsigo_device *xdev;
+
+ /* Allocate and initialise structure */
+ xdev = zalloc ( sizeof ( *xdev ) );
+ if ( ! xdev )
+ return -ENOMEM;
+ ref_init ( &xdev->refcnt, xsigo_free );
+ xdev->ibdev = ibdev_get ( ibdev );
+ xdev->name = ibdev->name;
+ timer_init ( &xdev->opener, xsigo_ib_open, &xdev->refcnt );
+ timer_init ( &xdev->discovery, xsigo_discover, &xdev->refcnt );
+ INIT_LIST_HEAD ( &xdev->managers );
+
+ /* Start timer to open Infiniband device. (We are currently
+ * within the Infiniband device probe callback list; opening
+ * the device here would have interesting side-effects.)
+ */
+ start_timer_nodelay ( &xdev->opener );
+
+ /* Add to list of devices and transfer reference to list */
+ list_add_tail ( &xdev->list, &xsigo_devices );
+ DBGC ( xdev, "XDEV %s created for " IB_GUID_FMT "\n",
+ xdev->name, IB_GUID_ARGS ( &ibdev->gid.s.guid ) );
+ return 0;
+}
+
+/**
+ * Handle device or link status change
+ *
+ * @v ibdev Infiniband device
+ */
+static void xsigo_ib_notify ( struct ib_device *ibdev ) {
+ struct xsigo_device *xdev;
+
+ /* Stop/restart discovery on any attached devices */
+ list_for_each_entry ( xdev, &xsigo_devices, list ) {
+
+ /* Skip non-attached devices */
+ if ( xdev->ibdev != ibdev )
+ continue;
+
+ /* Stop any ongoing discovery */
+ if ( xdev->madx ) {
+ ib_destroy_madx ( ibdev, ibdev->gsi, xdev->madx );
+ xdev->madx = NULL;
+ }
+ stop_timer ( &xdev->discovery );
+
+ /* If link is up, then start discovery */
+ if ( ib_link_ok ( ibdev ) )
+ start_timer_nodelay ( &xdev->discovery );
+ }
+}
+
+/**
+ * Remove Xsigo device
+ *
+ * @v ibdev Infiniband device
+ */
+static void xsigo_ib_remove ( struct ib_device *ibdev ) {
+ struct xsigo_device *xdev;
+ struct xsigo_device *tmp;
+
+ /* Remove any attached Xsigo devices */
+ list_for_each_entry_safe ( xdev, tmp, &xsigo_devices, list ) {
+
+ /* Skip non-attached devices */
+ if ( xdev->ibdev != ibdev )
+ continue;
+
+ /* Stop any ongoing discovery */
+ if ( xdev->madx ) {
+ ib_destroy_madx ( ibdev, ibdev->gsi, xdev->madx );
+ xdev->madx = NULL;
+ }
+ stop_timer ( &xdev->discovery );
+
+ /* Destroy all configuration managers */
+ xcm_list ( xdev, NULL, 0 );
+
+ /* Close Infiniband device, if applicable */
+ if ( ! timer_running ( &xdev->opener ) )
+ ib_close ( xdev->ibdev );
+
+ /* Stop link opener */
+ stop_timer ( &xdev->opener );
+
+ /* Remove from list of devices and drop list's reference */
+ DBGC ( xdev, "XDEV %s destroyed\n", xdev->name );
+ list_del ( &xdev->list );
+ ref_put ( &xdev->refcnt );
+ }
+}
+
+/** Xsigo Infiniband driver */
+struct ib_driver xsigo_ib_driver __ib_driver = {
+ .name = "Xsigo",
+ .probe = xsigo_ib_probe,
+ .notify = xsigo_ib_notify,
+ .remove = xsigo_ib_remove,
+};
+
+/****************************************************************************
+ *
+ * Network device driver
+ *
+ ****************************************************************************
+ */
+
+/**
+ * Handle device or link status change
+ *
+ * @v netdev Network device
+ */
+static void xsigo_net_notify ( struct net_device *netdev ) {
+ struct xsigo_device *xdev;
+ struct ib_device *ibdev;
+ struct xsigo_manager *xcm;
+ struct xsigo_nic *xve;
+ struct eoib_device *eoib;
+
+ /* Send current operational state to XCM, if applicable */
+ list_for_each_entry ( xdev, &xsigo_devices, list ) {
+ ibdev = xdev->ibdev;
+ list_for_each_entry ( xcm, &xdev->managers, list ) {
+ list_for_each_entry ( xve, &xcm->nics, list ) {
+ eoib = eoib_find ( ibdev, xve->mac );
+ if ( ! eoib )
+ continue;
+ if ( eoib->netdev != netdev )
+ continue;
+ xsmp_tx_xve_oper ( xcm, xve, eoib );
+ }
+ }
+ }
+}
+
+/** Xsigo network driver */
+struct net_driver xsigo_net_driver __net_driver = {
+ .name = "Xsigo",
+ .notify = xsigo_net_notify,
+};