388 строки
11 KiB
C
388 строки
11 KiB
C
/*
|
|
* net/tipc/ib_media.c: Infiniband bearer support for TIPC
|
|
*
|
|
* Copyright (c) 2013 Patrick McHardy <kaber@trash.net>
|
|
*
|
|
* Based on eth_media.c, which carries the following copyright notice:
|
|
*
|
|
* Copyright (c) 2001-2007, Ericsson AB
|
|
* Copyright (c) 2005-2008, 2011, Wind River Systems
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are met:
|
|
*
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. Neither the names of the copyright holders nor the names of its
|
|
* contributors may be used to endorse or promote products derived from
|
|
* this software without specific prior written permission.
|
|
*
|
|
* Alternatively, this software may be distributed under the terms of the
|
|
* GNU General Public License ("GPL") version 2 as published by the Free
|
|
* Software Foundation.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
* POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include <linux/if_infiniband.h>
|
|
#include "core.h"
|
|
#include "bearer.h"
|
|
|
|
#define MAX_IB_BEARERS MAX_BEARERS
|
|
|
|
/**
|
|
* struct ib_bearer - Infiniband bearer data structure
|
|
* @bearer: ptr to associated "generic" bearer structure
|
|
* @dev: ptr to associated Infiniband network device
|
|
* @tipc_packet_type: used in binding TIPC to Infiniband driver
|
|
* @cleanup: work item used when disabling bearer
|
|
*/
|
|
|
|
struct ib_bearer {
|
|
struct tipc_bearer *bearer;
|
|
struct net_device *dev;
|
|
struct packet_type tipc_packet_type;
|
|
struct work_struct setup;
|
|
struct work_struct cleanup;
|
|
};
|
|
|
|
static struct tipc_media ib_media_info;
|
|
static struct ib_bearer ib_bearers[MAX_IB_BEARERS];
|
|
static int ib_started;
|
|
|
|
/**
|
|
* ib_media_addr_set - initialize Infiniband media address structure
|
|
*
|
|
* Media-dependent "value" field stores MAC address in first 6 bytes
|
|
* and zeroes out the remaining bytes.
|
|
*/
|
|
static void ib_media_addr_set(const struct tipc_bearer *tb_ptr,
|
|
struct tipc_media_addr *a, char *mac)
|
|
{
|
|
BUILD_BUG_ON(sizeof(a->value) < INFINIBAND_ALEN);
|
|
memcpy(a->value, mac, INFINIBAND_ALEN);
|
|
a->media_id = TIPC_MEDIA_TYPE_IB;
|
|
a->broadcast = !memcmp(mac, tb_ptr->bcast_addr.value, INFINIBAND_ALEN);
|
|
}
|
|
|
|
/**
|
|
* send_msg - send a TIPC message out over an InfiniBand interface
|
|
*/
|
|
static int send_msg(struct sk_buff *buf, struct tipc_bearer *tb_ptr,
|
|
struct tipc_media_addr *dest)
|
|
{
|
|
struct sk_buff *clone;
|
|
struct net_device *dev;
|
|
int delta;
|
|
|
|
clone = skb_clone(buf, GFP_ATOMIC);
|
|
if (!clone)
|
|
return 0;
|
|
|
|
dev = ((struct ib_bearer *)(tb_ptr->usr_handle))->dev;
|
|
delta = dev->hard_header_len - skb_headroom(buf);
|
|
|
|
if ((delta > 0) &&
|
|
pskb_expand_head(clone, SKB_DATA_ALIGN(delta), 0, GFP_ATOMIC)) {
|
|
kfree_skb(clone);
|
|
return 0;
|
|
}
|
|
|
|
skb_reset_network_header(clone);
|
|
clone->dev = dev;
|
|
clone->protocol = htons(ETH_P_TIPC);
|
|
dev_hard_header(clone, dev, ETH_P_TIPC, dest->value,
|
|
dev->dev_addr, clone->len);
|
|
dev_queue_xmit(clone);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* recv_msg - handle incoming TIPC message from an InfiniBand interface
|
|
*
|
|
* Accept only packets explicitly sent to this node, or broadcast packets;
|
|
* ignores packets sent using InfiniBand multicast, and traffic sent to other
|
|
* nodes (which can happen if interface is running in promiscuous mode).
|
|
*/
|
|
static int recv_msg(struct sk_buff *buf, struct net_device *dev,
|
|
struct packet_type *pt, struct net_device *orig_dev)
|
|
{
|
|
struct ib_bearer *ib_ptr = (struct ib_bearer *)pt->af_packet_priv;
|
|
|
|
if (!net_eq(dev_net(dev), &init_net)) {
|
|
kfree_skb(buf);
|
|
return 0;
|
|
}
|
|
|
|
if (likely(ib_ptr->bearer)) {
|
|
if (likely(buf->pkt_type <= PACKET_BROADCAST)) {
|
|
buf->next = NULL;
|
|
tipc_recv_msg(buf, ib_ptr->bearer);
|
|
return 0;
|
|
}
|
|
}
|
|
kfree_skb(buf);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* setup_bearer - setup association between InfiniBand bearer and interface
|
|
*/
|
|
static void setup_bearer(struct work_struct *work)
|
|
{
|
|
struct ib_bearer *ib_ptr =
|
|
container_of(work, struct ib_bearer, setup);
|
|
|
|
dev_add_pack(&ib_ptr->tipc_packet_type);
|
|
}
|
|
|
|
/**
|
|
* enable_bearer - attach TIPC bearer to an InfiniBand interface
|
|
*/
|
|
static int enable_bearer(struct tipc_bearer *tb_ptr)
|
|
{
|
|
struct net_device *dev = NULL;
|
|
struct net_device *pdev = NULL;
|
|
struct ib_bearer *ib_ptr = &ib_bearers[0];
|
|
struct ib_bearer *stop = &ib_bearers[MAX_IB_BEARERS];
|
|
char *driver_name = strchr((const char *)tb_ptr->name, ':') + 1;
|
|
int pending_dev = 0;
|
|
|
|
/* Find unused InfiniBand bearer structure */
|
|
while (ib_ptr->dev) {
|
|
if (!ib_ptr->bearer)
|
|
pending_dev++;
|
|
if (++ib_ptr == stop)
|
|
return pending_dev ? -EAGAIN : -EDQUOT;
|
|
}
|
|
|
|
/* Find device with specified name */
|
|
read_lock(&dev_base_lock);
|
|
for_each_netdev(&init_net, pdev) {
|
|
if (!strncmp(pdev->name, driver_name, IFNAMSIZ)) {
|
|
dev = pdev;
|
|
dev_hold(dev);
|
|
break;
|
|
}
|
|
}
|
|
read_unlock(&dev_base_lock);
|
|
if (!dev)
|
|
return -ENODEV;
|
|
|
|
/* Create InfiniBand bearer for device */
|
|
ib_ptr->dev = dev;
|
|
ib_ptr->tipc_packet_type.type = htons(ETH_P_TIPC);
|
|
ib_ptr->tipc_packet_type.dev = dev;
|
|
ib_ptr->tipc_packet_type.func = recv_msg;
|
|
ib_ptr->tipc_packet_type.af_packet_priv = ib_ptr;
|
|
INIT_LIST_HEAD(&(ib_ptr->tipc_packet_type.list));
|
|
INIT_WORK(&ib_ptr->setup, setup_bearer);
|
|
schedule_work(&ib_ptr->setup);
|
|
|
|
/* Associate TIPC bearer with InfiniBand bearer */
|
|
ib_ptr->bearer = tb_ptr;
|
|
tb_ptr->usr_handle = (void *)ib_ptr;
|
|
memset(tb_ptr->bcast_addr.value, 0, sizeof(tb_ptr->bcast_addr.value));
|
|
memcpy(tb_ptr->bcast_addr.value, dev->broadcast, INFINIBAND_ALEN);
|
|
tb_ptr->bcast_addr.media_id = TIPC_MEDIA_TYPE_IB;
|
|
tb_ptr->bcast_addr.broadcast = 1;
|
|
tb_ptr->mtu = dev->mtu;
|
|
tb_ptr->blocked = 0;
|
|
ib_media_addr_set(tb_ptr, &tb_ptr->addr, (char *)dev->dev_addr);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* cleanup_bearer - break association between InfiniBand bearer and interface
|
|
*
|
|
* This routine must be invoked from a work queue because it can sleep.
|
|
*/
|
|
static void cleanup_bearer(struct work_struct *work)
|
|
{
|
|
struct ib_bearer *ib_ptr =
|
|
container_of(work, struct ib_bearer, cleanup);
|
|
|
|
dev_remove_pack(&ib_ptr->tipc_packet_type);
|
|
dev_put(ib_ptr->dev);
|
|
ib_ptr->dev = NULL;
|
|
}
|
|
|
|
/**
|
|
* disable_bearer - detach TIPC bearer from an InfiniBand interface
|
|
*
|
|
* Mark InfiniBand bearer as inactive so that incoming buffers are thrown away,
|
|
* then get worker thread to complete bearer cleanup. (Can't do cleanup
|
|
* here because cleanup code needs to sleep and caller holds spinlocks.)
|
|
*/
|
|
static void disable_bearer(struct tipc_bearer *tb_ptr)
|
|
{
|
|
struct ib_bearer *ib_ptr = (struct ib_bearer *)tb_ptr->usr_handle;
|
|
|
|
ib_ptr->bearer = NULL;
|
|
INIT_WORK(&ib_ptr->cleanup, cleanup_bearer);
|
|
schedule_work(&ib_ptr->cleanup);
|
|
}
|
|
|
|
/**
|
|
* recv_notification - handle device updates from OS
|
|
*
|
|
* Change the state of the InfiniBand bearer (if any) associated with the
|
|
* specified device.
|
|
*/
|
|
static int recv_notification(struct notifier_block *nb, unsigned long evt,
|
|
void *dv)
|
|
{
|
|
struct net_device *dev = (struct net_device *)dv;
|
|
struct ib_bearer *ib_ptr = &ib_bearers[0];
|
|
struct ib_bearer *stop = &ib_bearers[MAX_IB_BEARERS];
|
|
|
|
if (!net_eq(dev_net(dev), &init_net))
|
|
return NOTIFY_DONE;
|
|
|
|
while ((ib_ptr->dev != dev)) {
|
|
if (++ib_ptr == stop)
|
|
return NOTIFY_DONE; /* couldn't find device */
|
|
}
|
|
if (!ib_ptr->bearer)
|
|
return NOTIFY_DONE; /* bearer had been disabled */
|
|
|
|
ib_ptr->bearer->mtu = dev->mtu;
|
|
|
|
switch (evt) {
|
|
case NETDEV_CHANGE:
|
|
if (netif_carrier_ok(dev))
|
|
tipc_continue(ib_ptr->bearer);
|
|
else
|
|
tipc_block_bearer(ib_ptr->bearer->name);
|
|
break;
|
|
case NETDEV_UP:
|
|
tipc_continue(ib_ptr->bearer);
|
|
break;
|
|
case NETDEV_DOWN:
|
|
tipc_block_bearer(ib_ptr->bearer->name);
|
|
break;
|
|
case NETDEV_CHANGEMTU:
|
|
case NETDEV_CHANGEADDR:
|
|
tipc_block_bearer(ib_ptr->bearer->name);
|
|
tipc_continue(ib_ptr->bearer);
|
|
break;
|
|
case NETDEV_UNREGISTER:
|
|
case NETDEV_CHANGENAME:
|
|
tipc_disable_bearer(ib_ptr->bearer->name);
|
|
break;
|
|
}
|
|
return NOTIFY_OK;
|
|
}
|
|
|
|
static struct notifier_block notifier = {
|
|
.notifier_call = recv_notification,
|
|
.priority = 0,
|
|
};
|
|
|
|
/**
|
|
* ib_addr2str - convert InfiniBand address to string
|
|
*/
|
|
static int ib_addr2str(struct tipc_media_addr *a, char *str_buf, int str_size)
|
|
{
|
|
if (str_size < 60) /* 60 = 19 * strlen("xx:") + strlen("xx\0") */
|
|
return 1;
|
|
|
|
sprintf(str_buf, "%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:"
|
|
"%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x:%02x",
|
|
a->value[0], a->value[1], a->value[2], a->value[3],
|
|
a->value[4], a->value[5], a->value[6], a->value[7],
|
|
a->value[8], a->value[9], a->value[10], a->value[11],
|
|
a->value[12], a->value[13], a->value[14], a->value[15],
|
|
a->value[16], a->value[17], a->value[18], a->value[19]);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* ib_addr2msg - convert InfiniBand address format to message header format
|
|
*/
|
|
static int ib_addr2msg(struct tipc_media_addr *a, char *msg_area)
|
|
{
|
|
memset(msg_area, 0, TIPC_MEDIA_ADDR_SIZE);
|
|
msg_area[TIPC_MEDIA_TYPE_OFFSET] = TIPC_MEDIA_TYPE_IB;
|
|
memcpy(msg_area, a->value, INFINIBAND_ALEN);
|
|
return 0;
|
|
}
|
|
|
|
/**
 * ib_msg2addr - convert message header address format to InfiniBand format
 * @tb_ptr: bearer the address belongs to
 * @a: media address structure to fill in
 * @msg_area: message header area; the address is read from its start
 *
 * Thin wrapper around ib_media_addr_set().  Always returns 0.
 */
static int ib_msg2addr(const struct tipc_bearer *tb_ptr,
		       struct tipc_media_addr *a, char *msg_area)
{
	char *hw_addr = msg_area;

	ib_media_addr_set(tb_ptr, a, hw_addr);

	return 0;
}
|
|
|
|
/*
|
|
* InfiniBand media registration info
|
|
*/
|
|
static struct tipc_media ib_media_info = {
|
|
.send_msg = send_msg,
|
|
.enable_bearer = enable_bearer,
|
|
.disable_bearer = disable_bearer,
|
|
.addr2str = ib_addr2str,
|
|
.addr2msg = ib_addr2msg,
|
|
.msg2addr = ib_msg2addr,
|
|
.priority = TIPC_DEF_LINK_PRI,
|
|
.tolerance = TIPC_DEF_LINK_TOL,
|
|
.window = TIPC_DEF_LINK_WIN,
|
|
.type_id = TIPC_MEDIA_TYPE_IB,
|
|
.name = "ib"
|
|
};
|
|
|
|
/**
|
|
* tipc_ib_media_start - activate InfiniBand bearer support
|
|
*
|
|
* Register InfiniBand media type with TIPC bearer code. Also register
|
|
* with OS for notifications about device state changes.
|
|
*/
|
|
int tipc_ib_media_start(void)
|
|
{
|
|
int res;
|
|
|
|
if (ib_started)
|
|
return -EINVAL;
|
|
|
|
res = tipc_register_media(&ib_media_info);
|
|
if (res)
|
|
return res;
|
|
|
|
res = register_netdevice_notifier(¬ifier);
|
|
if (!res)
|
|
ib_started = 1;
|
|
return res;
|
|
}
|
|
|
|
/**
|
|
* tipc_ib_media_stop - deactivate InfiniBand bearer support
|
|
*/
|
|
void tipc_ib_media_stop(void)
|
|
{
|
|
if (!ib_started)
|
|
return;
|
|
|
|
flush_scheduled_work();
|
|
unregister_netdevice_notifier(¬ifier);
|
|
ib_started = 0;
|
|
}
|