37cb062007
TIPC is currently using the field 'af_packet_priv' in struct net_device as a handle to find the bearer instance associated to the given network device. But, by doing so it is blocking other networking cleanups, such as the one discussed here: http://patchwork.ozlabs.org/patch/178044/ This commit removes this usage from TIPC. Instead, we introduce a new field, 'tipc_ptr', to the net_device structure, to serve this purpose. When TIPC bearer is enabled, the bearer object is associated to 'tipc_ptr'. When a TIPC packet arrives in the recv_msg() upcall from a networking device, the bearer object can now be obtained from 'tipc_ptr'. When a bearer is disabled, the bearer object is detached from its underlying network device by setting 'tipc_ptr' to NULL. Additionally, an RCU lock is used to protect the new pointer. Henceforth, the existing tipc_net_lock is used in write mode to serialize write accesses to this pointer, while the new RCU lock is applied on the read side to ensure that the pointer is 100% valid within its wrapped area for all readers. Signed-off-by: Ying Xue <ying.xue@windriver.com> Cc: Patrick McHardy <kaber@trash.net> Reviewed-by: Paul Gortmaker <paul.gortmaker@windriver.com> Signed-off-by: Jon Maloy <jon.maloy@ericsson.com> Signed-off-by: David S. Miller <davem@davemloft.net>
366 lines
10 KiB
C
366 lines
10 KiB
C
/*
|
|
* net/tipc/ib_media.c: Infiniband bearer support for TIPC
|
|
*
|
|
* Copyright (c) 2013 Patrick McHardy <kaber@trash.net>
|
|
*
|
|
* Based on eth_media.c, which carries the following copyright notice:
|
|
*
|
|
* Copyright (c) 2001-2007, Ericsson AB
|
|
* Copyright (c) 2005-2008, 2011, Wind River Systems
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are met:
|
|
*
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. Neither the names of the copyright holders nor the names of its
|
|
* contributors may be used to endorse or promote products derived from
|
|
* this software without specific prior written permission.
|
|
*
|
|
* Alternatively, this software may be distributed under the terms of the
|
|
* GNU General Public License ("GPL") version 2 as published by the Free
|
|
* Software Foundation.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
* POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include <linux/if_infiniband.h>
|
|
#include "core.h"
|
|
#include "bearer.h"
|
|
|
|
#define MAX_IB_MEDIA MAX_BEARERS
|
|
|
|
/**
|
|
* struct ib_media - Infiniband media data structure
|
|
* @bearer: ptr to associated "generic" bearer structure
|
|
* @dev: ptr to associated Infiniband network device
|
|
* @tipc_packet_type: used in binding TIPC to Infiniband driver
|
|
* @cleanup: work item used when disabling bearer
|
|
*/
|
|
|
|
struct ib_media {
|
|
struct tipc_bearer *bearer;
|
|
struct net_device *dev;
|
|
struct packet_type tipc_packet_type;
|
|
struct work_struct setup;
|
|
struct work_struct cleanup;
|
|
};
|
|
|
|
static struct ib_media ib_media_array[MAX_IB_MEDIA];
|
|
static int ib_started;
|
|
static int recv_msg(struct sk_buff *buf, struct net_device *dev,
|
|
struct packet_type *pt, struct net_device *orig_dev);
|
|
|
|
static struct packet_type tipc_packet_type __read_mostly = {
|
|
.type = __constant_htons(ETH_P_TIPC),
|
|
.func = recv_msg,
|
|
};
|
|
|
|
/**
|
|
* ib_media_addr_set - initialize Infiniband media address structure
|
|
*
|
|
* Media-dependent "value" field stores MAC address in first 6 bytes
|
|
* and zeroes out the remaining bytes.
|
|
*/
|
|
static void ib_media_addr_set(const struct tipc_bearer *tb_ptr,
|
|
struct tipc_media_addr *a, char *mac)
|
|
{
|
|
BUILD_BUG_ON(sizeof(a->value) < INFINIBAND_ALEN);
|
|
memcpy(a->value, mac, INFINIBAND_ALEN);
|
|
a->media_id = TIPC_MEDIA_TYPE_IB;
|
|
a->broadcast = !memcmp(mac, tb_ptr->bcast_addr.value, INFINIBAND_ALEN);
|
|
}
|
|
|
|
/**
|
|
* send_msg - send a TIPC message out over an InfiniBand interface
|
|
*/
|
|
static int send_msg(struct sk_buff *buf, struct tipc_bearer *tb_ptr,
|
|
struct tipc_media_addr *dest)
|
|
{
|
|
struct sk_buff *clone;
|
|
struct net_device *dev;
|
|
int delta;
|
|
|
|
clone = skb_clone(buf, GFP_ATOMIC);
|
|
if (!clone)
|
|
return 0;
|
|
|
|
dev = ((struct ib_media *)(tb_ptr->usr_handle))->dev;
|
|
delta = dev->hard_header_len - skb_headroom(buf);
|
|
|
|
if ((delta > 0) &&
|
|
pskb_expand_head(clone, SKB_DATA_ALIGN(delta), 0, GFP_ATOMIC)) {
|
|
kfree_skb(clone);
|
|
return 0;
|
|
}
|
|
|
|
skb_reset_network_header(clone);
|
|
clone->dev = dev;
|
|
clone->protocol = htons(ETH_P_TIPC);
|
|
dev_hard_header(clone, dev, ETH_P_TIPC, dest->value,
|
|
dev->dev_addr, clone->len);
|
|
dev_queue_xmit(clone);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* recv_msg - handle incoming TIPC message from an InfiniBand interface
|
|
*
|
|
* Accept only packets explicitly sent to this node, or broadcast packets;
|
|
* ignores packets sent using InfiniBand multicast, and traffic sent to other
|
|
* nodes (which can happen if interface is running in promiscuous mode).
|
|
*/
|
|
static int recv_msg(struct sk_buff *buf, struct net_device *dev,
|
|
struct packet_type *pt, struct net_device *orig_dev)
|
|
{
|
|
struct tipc_bearer *b_ptr;
|
|
|
|
if (!net_eq(dev_net(dev), &init_net)) {
|
|
kfree_skb(buf);
|
|
return NET_RX_DROP;
|
|
}
|
|
|
|
rcu_read_lock();
|
|
b_ptr = rcu_dereference(dev->tipc_ptr);
|
|
if (likely(b_ptr)) {
|
|
if (likely(buf->pkt_type <= PACKET_BROADCAST)) {
|
|
buf->next = NULL;
|
|
tipc_recv_msg(buf, b_ptr);
|
|
rcu_read_unlock();
|
|
return NET_RX_SUCCESS;
|
|
}
|
|
}
|
|
rcu_read_unlock();
|
|
|
|
kfree_skb(buf);
|
|
return NET_RX_DROP;
|
|
}
|
|
|
|
/**
|
|
* setup_bearer - setup association between InfiniBand bearer and interface
|
|
*/
|
|
static void setup_media(struct work_struct *work)
|
|
{
|
|
dev_add_pack(&tipc_packet_type);
|
|
}
|
|
|
|
/**
|
|
* enable_media - attach TIPC bearer to an InfiniBand interface
|
|
*/
|
|
static int enable_media(struct tipc_bearer *tb_ptr)
|
|
{
|
|
struct net_device *dev;
|
|
struct ib_media *ib_ptr = &ib_media_array[0];
|
|
struct ib_media *stop = &ib_media_array[MAX_IB_MEDIA];
|
|
char *driver_name = strchr((const char *)tb_ptr->name, ':') + 1;
|
|
int pending_dev = 0;
|
|
|
|
/* Find unused InfiniBand bearer structure */
|
|
while (ib_ptr->dev) {
|
|
if (!ib_ptr->bearer)
|
|
pending_dev++;
|
|
if (++ib_ptr == stop)
|
|
return pending_dev ? -EAGAIN : -EDQUOT;
|
|
}
|
|
|
|
/* Find device with specified name */
|
|
dev = dev_get_by_name(&init_net, driver_name);
|
|
if (!dev)
|
|
return -ENODEV;
|
|
|
|
/* Create InfiniBand bearer for device */
|
|
ib_ptr->dev = dev;
|
|
INIT_WORK(&ib_ptr->setup, setup_media);
|
|
schedule_work(&ib_ptr->setup);
|
|
|
|
/* Associate TIPC bearer with InfiniBand bearer */
|
|
tb_ptr->dev = dev;
|
|
ib_ptr->bearer = tb_ptr;
|
|
tb_ptr->usr_handle = (void *)ib_ptr;
|
|
memset(tb_ptr->bcast_addr.value, 0, sizeof(tb_ptr->bcast_addr.value));
|
|
memcpy(tb_ptr->bcast_addr.value, dev->broadcast, INFINIBAND_ALEN);
|
|
tb_ptr->bcast_addr.media_id = TIPC_MEDIA_TYPE_IB;
|
|
tb_ptr->bcast_addr.broadcast = 1;
|
|
tb_ptr->mtu = dev->mtu;
|
|
ib_media_addr_set(tb_ptr, &tb_ptr->addr, (char *)dev->dev_addr);
|
|
rcu_assign_pointer(dev->tipc_ptr, tb_ptr);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* cleanup_bearer - break association between InfiniBand bearer and interface
|
|
*
|
|
* This routine must be invoked from a work queue because it can sleep.
|
|
*/
|
|
static void cleanup_bearer(struct work_struct *work)
|
|
{
|
|
struct ib_media *ib_ptr =
|
|
container_of(work, struct ib_media, cleanup);
|
|
|
|
dev_remove_pack(&tipc_packet_type);
|
|
dev_put(ib_ptr->dev);
|
|
ib_ptr->dev = NULL;
|
|
}
|
|
|
|
/**
|
|
* disable_media - detach TIPC bearer from an InfiniBand interface
|
|
*
|
|
* Mark InfiniBand bearer as inactive so that incoming buffers are thrown away,
|
|
* then get worker thread to complete bearer cleanup. (Can't do cleanup
|
|
* here because cleanup code needs to sleep and caller holds spinlocks.)
|
|
*/
|
|
static void disable_media(struct tipc_bearer *tb_ptr)
|
|
{
|
|
struct ib_media *ib_ptr = (struct ib_media *)tb_ptr->usr_handle;
|
|
|
|
ib_ptr->bearer = NULL;
|
|
INIT_WORK(&ib_ptr->cleanup, cleanup_bearer);
|
|
schedule_work(&ib_ptr->cleanup);
|
|
RCU_INIT_POINTER(tb_ptr->dev->tipc_ptr, NULL);
|
|
}
|
|
|
|
/**
|
|
* recv_notification - handle device updates from OS
|
|
*
|
|
* Change the state of the InfiniBand bearer (if any) associated with the
|
|
* specified device.
|
|
*/
|
|
static int recv_notification(struct notifier_block *nb, unsigned long evt,
|
|
void *ptr)
|
|
{
|
|
struct tipc_bearer *b_ptr;
|
|
struct net_device *dev = netdev_notifier_info_to_dev(ptr);
|
|
|
|
if (!net_eq(dev_net(dev), &init_net))
|
|
return NOTIFY_DONE;
|
|
|
|
rcu_read_lock();
|
|
b_ptr = rcu_dereference(dev->tipc_ptr);
|
|
if (!b_ptr) {
|
|
rcu_read_unlock();
|
|
return NOTIFY_DONE; /* bearer had been disabled */
|
|
}
|
|
|
|
b_ptr->mtu = dev->mtu;
|
|
|
|
switch (evt) {
|
|
case NETDEV_CHANGE:
|
|
if (netif_carrier_ok(dev))
|
|
break;
|
|
case NETDEV_DOWN:
|
|
case NETDEV_CHANGEMTU:
|
|
case NETDEV_CHANGEADDR:
|
|
tipc_reset_bearer(b_ptr);
|
|
break;
|
|
case NETDEV_UNREGISTER:
|
|
case NETDEV_CHANGENAME:
|
|
tipc_disable_bearer(b_ptr->name);
|
|
break;
|
|
}
|
|
rcu_read_unlock();
|
|
|
|
return NOTIFY_OK;
|
|
}
|
|
|
|
static struct notifier_block notifier = {
|
|
.notifier_call = recv_notification,
|
|
.priority = 0,
|
|
};
|
|
|
|
/**
|
|
* ib_addr2str - convert InfiniBand address to string
|
|
*/
|
|
static int ib_addr2str(struct tipc_media_addr *a, char *str_buf, int str_size)
|
|
{
|
|
if (str_size < 60) /* 60 = 19 * strlen("xx:") + strlen("xx\0") */
|
|
return 1;
|
|
|
|
sprintf(str_buf, "%20phC", a->value);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* ib_addr2msg - convert InfiniBand address format to message header format
|
|
*/
|
|
static int ib_addr2msg(struct tipc_media_addr *a, char *msg_area)
|
|
{
|
|
memset(msg_area, 0, TIPC_MEDIA_ADDR_SIZE);
|
|
msg_area[TIPC_MEDIA_TYPE_OFFSET] = TIPC_MEDIA_TYPE_IB;
|
|
memcpy(msg_area, a->value, INFINIBAND_ALEN);
|
|
return 0;
|
|
}
|
|
|
|
/**
 * ib_msg2addr - convert message header address format to InfiniBand format
 * @tb_ptr: bearer the address belongs to
 * @a: media address structure to fill in
 * @msg_area: message header area holding the address at offset 0
 *
 * Thin wrapper around ib_media_addr_set(). Always returns 0.
 */
static int ib_msg2addr(const struct tipc_bearer *tb_ptr,
		       struct tipc_media_addr *a, char *msg_area)
{
	ib_media_addr_set(tb_ptr, a, msg_area);

	return 0;
}
|
|
|
|
/*
|
|
* InfiniBand media registration info
|
|
*/
|
|
struct tipc_media ib_media_info = {
|
|
.send_msg = send_msg,
|
|
.enable_media = enable_media,
|
|
.disable_media = disable_media,
|
|
.addr2str = ib_addr2str,
|
|
.addr2msg = ib_addr2msg,
|
|
.msg2addr = ib_msg2addr,
|
|
.priority = TIPC_DEF_LINK_PRI,
|
|
.tolerance = TIPC_DEF_LINK_TOL,
|
|
.window = TIPC_DEF_LINK_WIN,
|
|
.type_id = TIPC_MEDIA_TYPE_IB,
|
|
.name = "ib"
|
|
};
|
|
|
|
/**
|
|
* tipc_ib_media_start - activate InfiniBand bearer support
|
|
*
|
|
* Register InfiniBand media type with TIPC bearer code. Also register
|
|
* with OS for notifications about device state changes.
|
|
*/
|
|
int tipc_ib_media_start(void)
|
|
{
|
|
int res;
|
|
|
|
if (ib_started)
|
|
return -EINVAL;
|
|
|
|
res = register_netdevice_notifier(¬ifier);
|
|
if (!res)
|
|
ib_started = 1;
|
|
return res;
|
|
}
|
|
|
|
/**
|
|
* tipc_ib_media_stop - deactivate InfiniBand bearer support
|
|
*/
|
|
void tipc_ib_media_stop(void)
|
|
{
|
|
if (!ib_started)
|
|
return;
|
|
|
|
flush_scheduled_work();
|
|
unregister_netdevice_notifier(¬ifier);
|
|
ib_started = 0;
|
|
}
|